diff --git a/.github/workflows/bundle-desktop-windows.yml b/.github/workflows/bundle-desktop-windows.yml index e82ab3d5ad4b..a657c11af581 100644 --- a/.github/workflows/bundle-desktop-windows.yml +++ b/.github/workflows/bundle-desktop-windows.yml @@ -1,6 +1,7 @@ name: "Bundle Desktop (Windows)" on: + workflow_dispatch: workflow_call: inputs: version: diff --git a/Cargo.lock b/Cargo.lock index b351444a38b5..cea87f982e1e 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -4170,7 +4170,7 @@ dependencies = [ [[package]] name = "goose" -version = "1.24.0" +version = "1.25.0" dependencies = [ "ahash", "anyhow", @@ -4266,7 +4266,7 @@ dependencies = [ [[package]] name = "goose-acp" -version = "1.24.0" +version = "1.25.0" dependencies = [ "agent-client-protocol-schema", "anyhow", @@ -4301,7 +4301,7 @@ dependencies = [ [[package]] name = "goose-cli" -version = "1.24.0" +version = "1.25.0" dependencies = [ "anstream", "anyhow", @@ -4351,7 +4351,7 @@ dependencies = [ [[package]] name = "goose-mcp" -version = "1.24.0" +version = "1.25.0" dependencies = [ "anyhow", "base64 0.22.1", @@ -4400,7 +4400,7 @@ dependencies = [ [[package]] name = "goose-server" -version = "1.24.0" +version = "1.25.0" dependencies = [ "anyhow", "axum 0.8.8", @@ -4446,7 +4446,7 @@ dependencies = [ [[package]] name = "goose-test" -version = "1.24.0" +version = "1.25.0" dependencies = [ "clap", "serde_json", @@ -4454,7 +4454,7 @@ dependencies = [ [[package]] name = "goose-test-support" -version = "1.24.0" +version = "1.25.0" dependencies = [ "axum 0.7.9", "rmcp 0.15.0", diff --git a/Cargo.toml b/Cargo.toml index 193a49791431..e3f344ff1d79 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -4,7 +4,7 @@ resolver = "2" [workspace.package] edition = "2021" -version = "1.24.0" +version = "1.25.0" authors = ["Block "] license = "Apache-2.0" repository = "https://github.com/block/goose" diff --git a/crates/goose-mcp/src/developer/rmcp_developer.rs b/crates/goose-mcp/src/developer/rmcp_developer.rs index e77b5b6883ae..006c5a9c175a 100644 --- a/crates/goose-mcp/src/developer/rmcp_developer.rs +++ b/crates/goose-mcp/src/developer/rmcp_developer.rs @@ -21,6 +21,8 @@ use rmcp::{ const WORKING_DIR_HEADER: &str = "agent-working-dir"; const SESSION_ID_HEADER: &str = "agent-session-id"; +pub const WORKING_DIR_PLACEHOLDER: &str = "{{WORKING_DIR}}"; + fn extract_working_dir_from_meta(meta: &Meta) -> Option { meta.0 .get(WORKING_DIR_HEADER) @@ -242,8 +244,6 @@ pub struct DeveloperServer { impl ServerHandler for DeveloperServer { #[allow(clippy::too_many_lines)] fn get_info(&self) -> ServerInfo { - // Get base instructions and working directory - let cwd = std::env::current_dir().expect("should have a current working dir"); let os = std::env::consts::OS; let in_container = Self::is_definitely_container(); @@ -268,7 +268,7 @@ impl ServerHandler for DeveloperServer { {container_info} "#, os=os, - cwd=cwd.to_string_lossy(), + cwd=WORKING_DIR_PLACEHOLDER, container_info=if in_container { "container: true" } else { "" }, }, _ => { @@ -295,7 +295,7 @@ impl ServerHandler for DeveloperServer { {container_info} "#, os=os, - cwd=cwd.to_string_lossy(), + cwd=WORKING_DIR_PLACEHOLDER, shell=shell_info, container_info=if in_container { "container: true" } else { "" }, } diff --git a/crates/goose-mcp/src/lib.rs b/crates/goose-mcp/src/lib.rs index f9c47a5b8203..e1077683c982 100644 --- a/crates/goose-mcp/src/lib.rs +++ b/crates/goose-mcp/src/lib.rs @@ -20,6 +20,7 @@ pub mod tutorial; pub use autovisualiser::AutoVisualiserRouter; pub use computercontroller::ComputerControllerServer; pub use developer::rmcp_developer::DeveloperServer; +pub use developer::rmcp_developer::WORKING_DIR_PLACEHOLDER; pub use memory::MemoryServer; pub use tutorial::TutorialServer; diff --git a/crates/goose-server/src/routes/recipe_utils.rs b/crates/goose-server/src/routes/recipe_utils.rs index ba068b732273..800283ddb46a 100644 --- a/crates/goose-server/src/routes/recipe_utils.rs +++ b/crates/goose-server/src/routes/recipe_utils.rs @@ -10,7 +10,9 @@ use crate::state::AppState; use anyhow::Result; use axum::http::StatusCode; use goose::agents::Agent; -use goose::recipe::build_recipe::{build_recipe_from_template, RecipeError}; +use goose::recipe::build_recipe::{ + build_recipe_from_template, resolve_sub_recipe_path, RecipeError, +}; use goose::recipe::local_recipes::{get_recipe_library_dir, list_local_recipes}; use goose::recipe::validate_recipe::validate_recipe_template_from_content; use goose::recipe::Recipe; @@ -44,13 +46,23 @@ pub fn short_id_from_path(path: &str) -> String { pub fn get_all_recipes_manifests() -> Result> { let recipes_with_path = list_local_recipes()?; let mut recipe_manifests_with_path = Vec::new(); - for (file_path, recipe) in recipes_with_path { + for (file_path, mut recipe) in recipes_with_path { let Ok(last_modified) = fs::metadata(file_path.clone()) .map(|m| chrono::DateTime::::from(m.modified().unwrap()).to_rfc3339()) else { continue; }; + if let Some(recipe_dir) = file_path.parent() { + if let Some(ref mut sub_recipes) = recipe.sub_recipes { + for sr in sub_recipes.iter_mut() { + if let Ok(resolved) = resolve_sub_recipe_path(&sr.path, recipe_dir) { + sr.path = resolved; + } + } + } + } + let manifest_with_path = RecipeManifest { id: short_id_from_path(file_path.to_string_lossy().as_ref()), recipe, @@ -126,10 +138,22 @@ pub async fn get_recipe_file_path_by_id( pub async fn load_recipe_by_id(state: &AppState, id: &str) -> Result { let path = get_recipe_file_path_by_id(state, id).await?; - Recipe::from_file_path(&path).map_err(|err| ErrorResponse { + let mut recipe = Recipe::from_file_path(&path).map_err(|err| ErrorResponse { message: format!("Failed to load recipe: {}", err), status: StatusCode::INTERNAL_SERVER_ERROR, - }) + })?; + + if let Some(recipe_dir) = path.parent() { + if let Some(ref mut sub_recipes) = recipe.sub_recipes { + for sr in sub_recipes.iter_mut() { + if let Ok(resolved) = resolve_sub_recipe_path(&sr.path, recipe_dir) { + sr.path = resolved; + } + } + } + } + + Ok(recipe) } pub async fn build_recipe_with_parameter_values( diff --git a/crates/goose/src/agents/agent.rs b/crates/goose/src/agents/agent.rs index 71fcb7931359..cce38d2922e3 100644 --- a/crates/goose/src/agents/agent.rs +++ b/crates/goose/src/agents/agent.rs @@ -646,7 +646,7 @@ impl Agent { } match agent_ref - .add_extension(config_clone, &session_id_clone) + .add_extension_inner(config_clone, &session_id_clone) .await { Ok(_) => ExtensionLoadResult { @@ -668,13 +668,43 @@ impl Agent { }) .collect::>(); - futures::future::join_all(extension_futures).await + let results = futures::future::join_all(extension_futures).await; + + // Persist once after all extensions are loaded + if results.iter().any(|r| r.success) { + if let Err(e) = self.persist_extension_state(&session_id).await { + warn!("Failed to persist extension state after bulk load: {}", e); + } + } + + results } pub async fn add_extension( &self, extension: ExtensionConfig, session_id: &str, + ) -> ExtensionResult<()> { + self.add_extension_inner(extension, session_id).await?; + + // Persist extension state after successful add + self.persist_extension_state(session_id) + .await + .map_err(|e| { + error!("Failed to persist extension state: {}", e); + crate::agents::extension::ExtensionError::SetupError(format!( + "Failed to persist extension state: {}", + e + )) + })?; + + Ok(()) + } + + async fn add_extension_inner( + &self, + extension: ExtensionConfig, + session_id: &str, ) -> ExtensionResult<()> { let session = self .config @@ -728,17 +758,6 @@ impl Agent { } } - // Persist extension state after successful add - self.persist_extension_state(session_id) - .await - .map_err(|e| { - error!("Failed to persist extension state: {}", e); - crate::agents::extension::ExtensionError::SetupError(format!( - "Failed to persist extension state: {}", - e - )) - })?; - Ok(()) } @@ -1695,7 +1714,15 @@ impl Agent { ) -> Result { tracing::info!("Starting recipe creation with {} messages", messages.len()); - let extensions_info = self.extension_manager.get_extensions_info().await; + let session = self + .config + .session_manager + .get_session(session_id, false) + .await?; + let extensions_info = self + .extension_manager + .get_extensions_info(&session.working_dir) + .await; tracing::debug!("Retrieved {} extensions info", extensions_info.len()); let (extension_count, tool_count) = self .extension_manager diff --git a/crates/goose/src/agents/extension_manager.rs b/crates/goose/src/agents/extension_manager.rs index 456bc9697e6d..d16f01b2181b 100644 --- a/crates/goose/src/agents/extension_manager.rs +++ b/crates/goose/src/agents/extension_manager.rs @@ -716,17 +716,17 @@ impl ExtensionManager { } /// Get extensions info for building the system prompt - pub async fn get_extensions_info(&self) -> Vec { + pub async fn get_extensions_info(&self, working_dir: &std::path::Path) -> Vec { + let working_dir_str = working_dir.to_string_lossy(); self.extensions .lock() .await .iter() .map(|(name, ext)| { - ExtensionInfo::new( - name, - ext.get_instructions().unwrap_or_default().as_str(), - ext.supports_resources(), - ) + let instructions = ext.get_instructions().unwrap_or_default(); + let instructions = + instructions.replace(goose_mcp::WORKING_DIR_PLACEHOLDER, &working_dir_str); + ExtensionInfo::new(name, &instructions, ext.supports_resources()) }) .collect() } diff --git a/crates/goose/src/agents/reply_parts.rs b/crates/goose/src/agents/reply_parts.rs index 54e6d81ae8ed..a220a843a657 100644 --- a/crates/goose/src/agents/reply_parts.rs +++ b/crates/goose/src/agents/reply_parts.rs @@ -162,7 +162,10 @@ impl Agent { tools.sort_by(|a, b| a.name.cmp(&b.name)); // Prepare system prompt - let extensions_info = self.extension_manager.get_extensions_info().await; + let extensions_info = self + .extension_manager + .get_extensions_info(working_dir) + .await; let (extension_count, tool_count) = self .extension_manager .get_extension_and_tool_counts(session_id) diff --git a/crates/goose/src/providers/canonical/data/canonical_mapping_report.json b/crates/goose/src/providers/canonical/data/canonical_mapping_report.json index 3d928d316f28..4256a5c7345e 100644 --- a/crates/goose/src/providers/canonical/data/canonical_mapping_report.json +++ b/crates/goose/src/providers/canonical/data/canonical_mapping_report.json @@ -1,5 +1,5 @@ { - "timestamp": "2026-02-13T17:38:00.310507+00:00", + "timestamp": "2026-02-23T18:23:49.176777+00:00", "unmapped_models": [ { "provider": "anthropic", @@ -65,6 +65,10 @@ "provider": "databricks", "model": "databricks-bge-large-en" }, + { + "provider": "databricks", + "model": "databricks-gemini-3-1-pro" + }, { "provider": "databricks", "model": "databricks-gemini-3-flash" @@ -101,6 +105,14 @@ "provider": "databricks", "model": "databricks-meta-llama-3-1-8b-instruct" }, + { + "provider": "databricks", + "model": "databricks-qwen3-embedding-0-6b" + }, + { + "provider": "databricks", + "model": "databricks-qwen3-next-80b-a3b-instruct" + }, { "provider": "databricks", "model": "dummy-model-ml-gp-endpoint" @@ -323,7 +335,11 @@ }, { "provider": "google", - "model": "gemini-exp-1206" + "model": "gemini-3.1-pro-preview" + }, + { + "provider": "google", + "model": "gemini-3.1-pro-preview-customtools" }, { "provider": "google", @@ -365,18 +381,10 @@ "provider": "google", "model": "imagen-4.0-generate-001" }, - { - "provider": "google", - "model": "imagen-4.0-generate-preview-06-06" - }, { "provider": "google", "model": "imagen-4.0-ultra-generate-001" }, - { - "provider": "google", - "model": "imagen-4.0-ultra-generate-preview-06-06" - }, { "provider": "google", "model": "nano-banana-pro-preview" @@ -573,10 +581,6 @@ "provider": "openai", "model": "babbage:ft-square-2023-02-28-14-48-38" }, - { - "provider": "openai", - "model": "chatgpt-4o-latest" - }, { "provider": "openai", "model": "chatgpt-image-latest" @@ -1529,6 +1533,30 @@ "provider": "openai", "model": "ft:gpt-4.1-mini-2025-04-14:square::BwjlIMor:ckpt-step-1018" }, + { + "provider": "openai", + "model": "ft:gpt-4.1-mini-2025-04-14:square:plat-completion:DAHA8Zfx:ckpt-step-58" + }, + { + "provider": "openai", + "model": "ft:gpt-4.1-mini-2025-04-14:square:plat-completion:DAHA9OcK" + }, + { + "provider": "openai", + "model": "ft:gpt-4.1-mini-2025-04-14:square:plat-completion:DAHA9hzA:ckpt-step-116" + }, + { + "provider": "openai", + "model": "ft:gpt-4.1-mini-2025-04-14:square:plat-ft:DA58ZIKa:ckpt-step-912" + }, + { + "provider": "openai", + "model": "ft:gpt-4.1-mini-2025-04-14:square:plat-ft:DA58a3A7:ckpt-step-1824" + }, + { + "provider": "openai", + "model": "ft:gpt-4.1-mini-2025-04-14:square:plat-ft:DA58aFG0" + }, { "provider": "openai", "model": "ft:gpt-4.1-nano-2025-04-14:square:qliao-plathelp-v1:CRNAywx8" @@ -2681,6 +2709,10 @@ "provider": "openai", "model": "gpt-audio" }, + { + "provider": "openai", + "model": "gpt-audio-1.5" + }, { "provider": "openai", "model": "gpt-audio-2025-08-28" @@ -2713,6 +2745,10 @@ "provider": "openai", "model": "gpt-realtime" }, + { + "provider": "openai", + "model": "gpt-realtime-1.5" + }, { "provider": "openai", "model": "gpt-realtime-2025-08-28" @@ -2769,14 +2805,58 @@ "provider": "openrouter", "model": "ai21/jamba-large-1.7" }, + { + "provider": "openrouter", + "model": "aion-labs/aion-1.0" + }, + { + "provider": "openrouter", + "model": "aion-labs/aion-1.0-mini" + }, + { + "provider": "openrouter", + "model": "aion-labs/aion-rp-llama-3.1-8b" + }, + { + "provider": "openrouter", + "model": "alfredpros/codellama-7b-instruct-solidity" + }, { "provider": "openrouter", "model": "alibaba/tongyi-deepresearch-30b-a3b" }, + { + "provider": "openrouter", + "model": "allenai/molmo-2-8b" + }, + { + "provider": "openrouter", + "model": "allenai/olmo-2-0325-32b-instruct" + }, + { + "provider": "openrouter", + "model": "allenai/olmo-3-32b-think" + }, + { + "provider": "openrouter", + "model": "allenai/olmo-3-7b-instruct" + }, + { + "provider": "openrouter", + "model": "allenai/olmo-3-7b-think" + }, { "provider": "openrouter", "model": "allenai/olmo-3.1-32b-instruct" }, + { + "provider": "openrouter", + "model": "allenai/olmo-3.1-32b-think" + }, + { + "provider": "openrouter", + "model": "alpindale/goliath-120b" + }, { "provider": "openrouter", "model": "amazon/nova-2-lite-v1" @@ -2799,15 +2879,23 @@ }, { "provider": "openrouter", - "model": "anthropic/claude-3-haiku" + "model": "anthracite-org/magnum-v4-72b" + }, + { + "provider": "openrouter", + "model": "anthropic/claude-3.7-sonnet:thinking" }, { "provider": "openrouter", - "model": "anthropic/claude-3.5-sonnet" + "model": "arcee-ai/coder-large" }, { "provider": "openrouter", - "model": "anthropic/claude-3.7-sonnet:thinking" + "model": "arcee-ai/maestro-reasoning" + }, + { + "provider": "openrouter", + "model": "arcee-ai/spotlight" }, { "provider": "openrouter", @@ -2821,10 +2909,22 @@ "provider": "openrouter", "model": "baidu/ernie-4.5-21b-a3b" }, + { + "provider": "openrouter", + "model": "baidu/ernie-4.5-21b-a3b-thinking" + }, + { + "provider": "openrouter", + "model": "baidu/ernie-4.5-300b-a47b" + }, { "provider": "openrouter", "model": "baidu/ernie-4.5-vl-28b-a3b" }, + { + "provider": "openrouter", + "model": "baidu/ernie-4.5-vl-424b-a47b" + }, { "provider": "openrouter", "model": "bytedance-seed/seed-1.6" @@ -2835,15 +2935,15 @@ }, { "provider": "openrouter", - "model": "cohere/command-r-08-2024" + "model": "bytedance/ui-tars-1.5-7b" }, { "provider": "openrouter", - "model": "cohere/command-r-plus-08-2024" + "model": "cohere/command-a" }, { "provider": "openrouter", - "model": "deepseek/deepseek-chat" + "model": "deepcogito/cogito-v2.1-671b" }, { "provider": "openrouter", @@ -2853,10 +2953,22 @@ "provider": "openrouter", "model": "deepseek/deepseek-r1-0528" }, + { + "provider": "openrouter", + "model": "deepseek/deepseek-r1-distill-qwen-32b" + }, { "provider": "openrouter", "model": "deepseek/deepseek-v3.2-exp" }, + { + "provider": "openrouter", + "model": "eleutherai/llemma_7b" + }, + { + "provider": "openrouter", + "model": "essentialai/rnj-1-instruct" + }, { "provider": "openrouter", "model": "google/gemini-2.0-flash-lite-001" @@ -2865,6 +2977,26 @@ "provider": "openrouter", "model": "google/gemini-2.5-pro-preview" }, + { + "provider": "openrouter", + "model": "google/gemini-3-pro-image-preview" + }, + { + "provider": "openrouter", + "model": "google/gemini-3.1-pro-preview" + }, + { + "provider": "openrouter", + "model": "google/gemma-2-27b-it" + }, + { + "provider": "openrouter", + "model": "gryphe/mythomax-l2-13b" + }, + { + "provider": "openrouter", + "model": "ibm-granite/granite-4.0-h-micro" + }, { "provider": "openrouter", "model": "inception/mercury" @@ -2873,14 +3005,46 @@ "provider": "openrouter", "model": "inception/mercury-coder" }, + { + "provider": "openrouter", + "model": "inflection/inflection-3-pi" + }, + { + "provider": "openrouter", + "model": "inflection/inflection-3-productivity" + }, { "provider": "openrouter", "model": "kwaipilot/kat-coder-pro" }, + { + "provider": "openrouter", + "model": "liquid/lfm-2.2-6b" + }, + { + "provider": "openrouter", + "model": "liquid/lfm2-8b-a1b" + }, + { + "provider": "openrouter", + "model": "mancer/weaver" + }, + { + "provider": "openrouter", + "model": "meituan/longcat-flash-chat" + }, + { + "provider": "openrouter", + "model": "meta-llama/llama-3-70b-instruct" + }, { "provider": "openrouter", "model": "meta-llama/llama-3-8b-instruct" }, + { + "provider": "openrouter", + "model": "meta-llama/llama-3.1-405b" + }, { "provider": "openrouter", "model": "meta-llama/llama-3.1-405b-instruct" @@ -2895,7 +3059,11 @@ }, { "provider": "openrouter", - "model": "meta-llama/llama-3.3-70b-instruct" + "model": "meta-llama/llama-3.2-1b-instruct" + }, + { + "provider": "openrouter", + "model": "meta-llama/llama-3.2-3b-instruct" }, { "provider": "openrouter", @@ -2907,39 +3075,47 @@ }, { "provider": "openrouter", - "model": "minimax/minimax-m2.5" + "model": "meta-llama/llama-guard-2-8b" }, { "provider": "openrouter", - "model": "mistralai/ministral-14b-2512" + "model": "meta-llama/llama-guard-3-8b" + }, + { + "provider": "openrouter", + "model": "meta-llama/llama-guard-4-12b" + }, + { + "provider": "openrouter", + "model": "microsoft/phi-4" }, { "provider": "openrouter", - "model": "mistralai/ministral-3b-2512" + "model": "microsoft/wizardlm-2-8x22b" }, { "provider": "openrouter", - "model": "mistralai/ministral-8b-2512" + "model": "minimax/minimax-m2-her" }, { "provider": "openrouter", - "model": "mistralai/mistral-large" + "model": "mistralai/ministral-14b-2512" }, { "provider": "openrouter", - "model": "mistralai/mistral-large-2407" + "model": "mistralai/mistral-7b-instruct" }, { "provider": "openrouter", - "model": "mistralai/mistral-large-2411" + "model": "mistralai/mistral-7b-instruct-v0.1" }, { "provider": "openrouter", - "model": "mistralai/mistral-large-2512" + "model": "mistralai/mistral-7b-instruct-v0.2" }, { "provider": "openrouter", - "model": "mistralai/mistral-nemo" + "model": "mistralai/mistral-7b-instruct-v0.3" }, { "provider": "openrouter", @@ -2967,87 +3143,87 @@ }, { "provider": "openrouter", - "model": "mistralai/pixtral-large-2411" + "model": "mistralai/voxtral-small-24b-2507" }, { "provider": "openrouter", - "model": "mistralai/voxtral-small-24b-2507" + "model": "morph/morph-v3-fast" }, { "provider": "openrouter", - "model": "nex-agi/deepseek-v3.1-nex-n1" + "model": "morph/morph-v3-large" }, { "provider": "openrouter", - "model": "nousresearch/deephermes-3-mistral-24b-preview" + "model": "neversleep/llama-3.1-lumimaid-8b" }, { "provider": "openrouter", - "model": "nvidia/llama-3.1-nemotron-70b-instruct" + "model": "neversleep/noromaid-20b" }, { "provider": "openrouter", - "model": "nvidia/llama-3.3-nemotron-super-49b-v1.5" + "model": "nex-agi/deepseek-v3.1-nex-n1" }, { "provider": "openrouter", - "model": "nvidia/nemotron-3-nano-30b-a3b" + "model": "nousresearch/hermes-2-pro-llama-3-8b" }, { "provider": "openrouter", - "model": "openai/gpt-3.5-turbo" + "model": "nousresearch/hermes-3-llama-3.1-405b" }, { "provider": "openrouter", - "model": "openai/gpt-3.5-turbo-0613" + "model": "nousresearch/hermes-3-llama-3.1-70b" }, { "provider": "openrouter", - "model": "openai/gpt-3.5-turbo-16k" + "model": "nvidia/llama-3.1-nemotron-70b-instruct" }, { "provider": "openrouter", - "model": "openai/gpt-4" + "model": "nvidia/llama-3.1-nemotron-ultra-253b-v1" }, { "provider": "openrouter", - "model": "openai/gpt-4-0314" + "model": "nvidia/llama-3.3-nemotron-super-49b-v1.5" }, { "provider": "openrouter", - "model": "openai/gpt-4-1106-preview" + "model": "nvidia/nemotron-3-nano-30b-a3b" }, { "provider": "openrouter", - "model": "openai/gpt-4-turbo" + "model": "nvidia/nemotron-nano-12b-v2-vl" }, { "provider": "openrouter", - "model": "openai/gpt-4-turbo-preview" + "model": "openai/gpt-3.5-turbo-16k" }, { "provider": "openrouter", - "model": "openai/gpt-4.1-nano" + "model": "openai/gpt-3.5-turbo-instruct" }, { "provider": "openrouter", - "model": "openai/gpt-4o" + "model": "openai/gpt-4-1106-preview" }, { "provider": "openrouter", - "model": "openai/gpt-4o-2024-05-13" + "model": "openai/gpt-4-turbo-preview" }, { "provider": "openrouter", - "model": "openai/gpt-4o-2024-08-06" + "model": "openai/gpt-4o-audio-preview" }, { "provider": "openrouter", - "model": "openai/gpt-4o-2024-11-20" + "model": "openai/gpt-4o-mini-search-preview" }, { "provider": "openrouter", - "model": "openai/gpt-4o-audio-preview" + "model": "openai/gpt-4o-search-preview" }, { "provider": "openrouter", @@ -3059,51 +3235,55 @@ }, { "provider": "openrouter", - "model": "openai/o1" + "model": "openai/gpt-audio" }, { "provider": "openrouter", - "model": "openai/o3" + "model": "openai/gpt-audio-mini" }, { "provider": "openrouter", - "model": "openai/o3-deep-research" + "model": "openai/o3-mini-high" }, { "provider": "openrouter", - "model": "openai/o3-mini" + "model": "openai/o4-mini-high" }, { "provider": "openrouter", - "model": "openai/o3-mini-high" + "model": "opengvlab/internvl3-78b" }, { "provider": "openrouter", - "model": "openai/o3-pro" + "model": "openrouter/auto" }, { "provider": "openrouter", - "model": "openai/o4-mini-deep-research" + "model": "openrouter/bodybuilder" }, { "provider": "openrouter", - "model": "openai/o4-mini-high" + "model": "openrouter/free" }, { "provider": "openrouter", - "model": "openrouter/aurora-alpha" + "model": "perplexity/sonar" }, { "provider": "openrouter", - "model": "openrouter/auto" + "model": "perplexity/sonar-deep-research" }, { "provider": "openrouter", - "model": "openrouter/free" + "model": "perplexity/sonar-pro" + }, + { + "provider": "openrouter", + "model": "perplexity/sonar-pro-search" }, { "provider": "openrouter", - "model": "prime-intellect/intellect-3" + "model": "perplexity/sonar-reasoning-pro" }, { "provider": "openrouter", @@ -3113,6 +3293,10 @@ "provider": "openrouter", "model": "qwen/qwen-2.5-7b-instruct" }, + { + "provider": "openrouter", + "model": "qwen/qwen-2.5-vl-7b-instruct" + }, { "provider": "openrouter", "model": "qwen/qwen-max" @@ -3137,6 +3321,18 @@ "provider": "openrouter", "model": "qwen/qwen-vl-max" }, + { + "provider": "openrouter", + "model": "qwen/qwen-vl-plus" + }, + { + "provider": "openrouter", + "model": "qwen/qwen2.5-coder-7b-instruct" + }, + { + "provider": "openrouter", + "model": "qwen/qwen2.5-vl-32b-instruct" + }, { "provider": "openrouter", "model": "qwen/qwen3-14b" @@ -3157,10 +3353,6 @@ "provider": "openrouter", "model": "qwen/qwen3-32b" }, - { - "provider": "openrouter", - "model": "qwen/qwen3-4b" - }, { "provider": "openrouter", "model": "qwen/qwen3-8b" @@ -3209,6 +3401,14 @@ "provider": "openrouter", "model": "qwen/qwq-32b" }, + { + "provider": "openrouter", + "model": "raifle/sorcererlm-8x22b" + }, + { + "provider": "openrouter", + "model": "relace/relace-apply-3" + }, { "provider": "openrouter", "model": "relace/relace-search" @@ -3217,22 +3417,42 @@ "provider": "openrouter", "model": "sao10k/l3-euryale-70b" }, + { + "provider": "openrouter", + "model": "sao10k/l3-lunaris-8b" + }, + { + "provider": "openrouter", + "model": "sao10k/l3.1-70b-hanami-x1" + }, { "provider": "openrouter", "model": "sao10k/l3.1-euryale-70b" }, { "provider": "openrouter", - "model": "stepfun/step-3.5-flash" + "model": "sao10k/l3.3-euryale-70b" + }, + { + "provider": "openrouter", + "model": "switchpoint/router" + }, + { + "provider": "openrouter", + "model": "tencent/hunyuan-a13b-instruct" }, { "provider": "openrouter", - "model": "stepfun/step-3.5-flash:free" + "model": "thedrummer/cydonia-24b-v4.1" }, { "provider": "openrouter", "model": "thedrummer/rocinante-12b" }, + { + "provider": "openrouter", + "model": "thedrummer/skyfall-36b-v2" + }, { "provider": "openrouter", "model": "thedrummer/unslopnemo-12b" @@ -3243,12 +3463,16 @@ }, { "provider": "openrouter", - "model": "tngtech/tng-r1t-chimera" + "model": "undi95/remm-slerp-l2-13b" }, { "provider": "openrouter", "model": "upstage/solar-pro-3:free" }, + { + "provider": "openrouter", + "model": "writer/palmyra-x5" + }, { "provider": "openrouter", "model": "z-ai/glm-4-32b" @@ -3258,8 +3482,32 @@ "model": "z-ai/glm-4.6v" }, { - "provider": "openrouter", - "model": "z-ai/glm-5" + "provider": "tetrate", + "model": "chatgpt-4o-latest" + }, + { + "provider": "tetrate", + "model": "deepinfra/BAAI/bge-base-en-v1.5" + }, + { + "provider": "tetrate", + "model": "deepinfra/BAAI/bge-en-icl" + }, + { + "provider": "tetrate", + "model": "deepinfra/BAAI/bge-large-en-v1.5" + }, + { + "provider": "tetrate", + "model": "deepinfra/BAAI/bge-m3" + }, + { + "provider": "tetrate", + "model": "deepinfra/BAAI/bge-m3-multi" + }, + { + "provider": "tetrate", + "model": "deepinfra/Gryphe/MythoMax-L2-13b" }, { "provider": "tetrate", @@ -3273,10 +3521,18 @@ "provider": "tetrate", "model": "deepinfra/NousResearch/Hermes-3-Llama-3.1-70B" }, + { + "provider": "tetrate", + "model": "deepinfra/PaddlePaddle/PaddleOCR-VL-0.9B" + }, { "provider": "tetrate", "model": "deepinfra/Qwen/Qwen2.5-72B-Instruct" }, + { + "provider": "tetrate", + "model": "deepinfra/Qwen/Qwen2.5-VL-32B-Instruct" + }, { "provider": "tetrate", "model": "deepinfra/Qwen/Qwen3-14B" @@ -3307,27 +3563,75 @@ }, { "provider": "tetrate", - "model": "deepinfra/Qwen/Qwen3-Next-80B-A3B-Instruct" + "model": "deepinfra/Qwen/Qwen3-Embedding-0.6B" }, { "provider": "tetrate", - "model": "deepinfra/Qwen/Qwen3-VL-235B-A22B-Instruct" + "model": "deepinfra/Qwen/Qwen3-Embedding-0.6B-batch" }, { "provider": "tetrate", - "model": "deepinfra/Qwen/Qwen3-VL-30B-A3B-Instruct" + "model": "deepinfra/Qwen/Qwen3-Embedding-4B" }, { "provider": "tetrate", - "model": "deepinfra/deepseek-ai/DeepSeek-R1-0528" + "model": "deepinfra/Qwen/Qwen3-Embedding-4B-batch" }, { "provider": "tetrate", - "model": "deepinfra/deepseek-ai/DeepSeek-R1-0528-Turbo" + "model": "deepinfra/Qwen/Qwen3-Embedding-8B" }, { "provider": "tetrate", - "model": "deepinfra/deepseek-ai/DeepSeek-V3" + "model": "deepinfra/Qwen/Qwen3-Embedding-8B-batch" + }, + { + "provider": "tetrate", + "model": "deepinfra/Qwen/Qwen3-Next-80B-A3B-Instruct" + }, + { + "provider": "tetrate", + "model": "deepinfra/Qwen/Qwen3-VL-235B-A22B-Instruct" + }, + { + "provider": "tetrate", + "model": "deepinfra/Qwen/Qwen3-VL-30B-A3B-Instruct" + }, + { + "provider": "tetrate", + "model": "deepinfra/Sao10K/L3-8B-Lunaris-v1-Turbo" + }, + { + "provider": "tetrate", + "model": "deepinfra/Sao10K/L3.1-70B-Euryale-v2.2" + }, + { + "provider": "tetrate", + "model": "deepinfra/Sao10K/L3.3-70B-Euryale-v2.3" + }, + { + "provider": "tetrate", + "model": "deepinfra/allenai/olmOCR-2-7B-1025" + }, + { + "provider": "tetrate", + "model": "deepinfra/deepseek-ai/DeepSeek-OCR" + }, + { + "provider": "tetrate", + "model": "deepinfra/deepseek-ai/DeepSeek-R1-0528" + }, + { + "provider": "tetrate", + "model": "deepinfra/deepseek-ai/DeepSeek-R1-0528-Turbo" + }, + { + "provider": "tetrate", + "model": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B" + }, + { + "provider": "tetrate", + "model": "deepinfra/deepseek-ai/DeepSeek-V3" }, { "provider": "tetrate", @@ -3345,6 +3649,10 @@ "provider": "tetrate", "model": "deepinfra/deepseek-ai/DeepSeek-V3.2" }, + { + "provider": "tetrate", + "model": "deepinfra/google/embeddinggemma-300m" + }, { "provider": "tetrate", "model": "deepinfra/google/gemini-2.0-flash-001" @@ -3361,6 +3669,26 @@ "provider": "tetrate", "model": "deepinfra/google/gemma-3-4b-it" }, + { + "provider": "tetrate", + "model": "deepinfra/intfloat/e5-base-v2" + }, + { + "provider": "tetrate", + "model": "deepinfra/intfloat/e5-large-v2" + }, + { + "provider": "tetrate", + "model": "deepinfra/intfloat/multilingual-e5-large" + }, + { + "provider": "tetrate", + "model": "deepinfra/intfloat/multilingual-e5-large-instruct" + }, + { + "provider": "tetrate", + "model": "deepinfra/meta-llama/Llama-3.2-11B-Vision-Instruct" + }, { "provider": "tetrate", "model": "deepinfra/meta-llama/Llama-3.2-3B-Instruct" @@ -3369,6 +3697,10 @@ "provider": "tetrate", "model": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo" }, + { + "provider": "tetrate", + "model": "deepinfra/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8" + }, { "provider": "tetrate", "model": "deepinfra/meta-llama/Llama-4-Scout-17B-16E-Instruct" @@ -3393,6 +3725,14 @@ "provider": "tetrate", "model": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo" }, + { + "provider": "tetrate", + "model": "deepinfra/microsoft/WizardLM-2-8x22B" + }, + { + "provider": "tetrate", + "model": "deepinfra/microsoft/phi-4" + }, { "provider": "tetrate", "model": "deepinfra/mistralai/Mistral-Nemo-Instruct-2407" @@ -3425,6 +3765,10 @@ "provider": "tetrate", "model": "deepinfra/nvidia/Llama-3.3-Nemotron-Super-49B-v1.5" }, + { + "provider": "tetrate", + "model": "deepinfra/nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL" + }, { "provider": "tetrate", "model": "deepinfra/nvidia/NVIDIA-Nemotron-Nano-9B-v2" @@ -3445,6 +3789,46 @@ "provider": "tetrate", "model": "deepinfra/openai/gpt-oss-20b" }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/all-MiniLM-L12-v2" + }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/all-MiniLM-L6-v2" + }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/all-mpnet-base-v2" + }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/clip-ViT-B-32" + }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/clip-ViT-B-32-multilingual-v1" + }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/multi-qa-mpnet-base-dot-v1" + }, + { + "provider": "tetrate", + "model": "deepinfra/sentence-transformers/paraphrase-MiniLM-L6-v2" + }, + { + "provider": "tetrate", + "model": "deepinfra/shibing624/text2vec-base-chinese" + }, + { + "provider": "tetrate", + "model": "deepinfra/thenlper/gte-base" + }, + { + "provider": "tetrate", + "model": "deepinfra/thenlper/gte-large" + }, { "provider": "tetrate", "model": "deepinfra/zai-org/GLM-4.6" @@ -3465,6 +3849,26 @@ "provider": "tetrate", "model": "gemini-2.0-flash-lite-001" }, + { + "provider": "tetrate", + "model": "gemini-robotics-er-1.5-preview" + }, + { + "provider": "tetrate", + "model": "gpt-4o-mini-search-preview" + }, + { + "provider": "tetrate", + "model": "gpt-4o-mini-search-preview-2025-03-11" + }, + { + "provider": "tetrate", + "model": "gpt-4o-search-preview" + }, + { + "provider": "tetrate", + "model": "gpt-4o-search-preview-2025-03-11" + }, { "provider": "tetrate", "model": "groq/llama-3.1-8b-instant" @@ -3497,6 +3901,18 @@ "provider": "tetrate", "model": "groq/qwen/qwen3-32b" }, + { + "provider": "tetrate", + "model": "text-embedding-3-large" + }, + { + "provider": "tetrate", + "model": "text-embedding-3-small" + }, + { + "provider": "tetrate", + "model": "text-embedding-ada-002" + }, { "provider": "tetrate", "model": "xai/grok-3-beta" @@ -3536,14 +3952,6 @@ ], "all_mappings": { "anthropic": [ - { - "provider_model": "claude-3-5-haiku-20241022", - "canonical_model": "anthropic/claude-3.5-haiku" - }, - { - "provider_model": "claude-3-7-sonnet-20250219", - "canonical_model": "anthropic/claude-3.7-sonnet" - }, { "provider_model": "claude-3-haiku-20240307", "canonical_model": "anthropic/claude-3-haiku" @@ -3575,6 +3983,10 @@ { "provider_model": "claude-sonnet-4-5-20250929", "canonical_model": "anthropic/claude-sonnet-4.5" + }, + { + "provider_model": "claude-sonnet-4-6", + "canonical_model": "anthropic/claude-sonnet-4.6" } ], "aws_bedrock": [], @@ -3632,6 +4044,10 @@ "provider_model": "databricks-claude-sonnet-4-5", "canonical_model": "anthropic/claude-sonnet-4.5" }, + { + "provider_model": "databricks-claude-sonnet-4-6", + "canonical_model": "anthropic/claude-sonnet-4.6" + }, { "provider_model": "databricks-gemini-2-5-flash", "canonical_model": "google/gemini-2.5-flash" @@ -3856,6 +4272,10 @@ "provider_model": "kgoose-claude-haiku-4-5", "canonical_model": "anthropic/claude-haiku-4.5" }, + { + "provider_model": "kgoose-claude-opus-4-6", + "canonical_model": "anthropic/claude-opus-4.6" + }, { "provider_model": "kgoose-claude-sonnet-4-5", "canonical_model": "anthropic/claude-sonnet-4.5" @@ -3987,10 +4407,6 @@ "provider_model": "gemini-2.5-flash-lite-preview-09-2025", "canonical_model": "google/gemini-2.5-flash-lite-preview-09" }, - { - "provider_model": "gemini-2.5-flash-preview-09-2025", - "canonical_model": "google/gemini-2.5-flash-preview-09" - }, { "provider_model": "gemini-2.5-flash-preview-tts", "canonical_model": "google/gemini-2.5-flash-preview-tts" @@ -4271,10 +4687,18 @@ } ], "openrouter": [ + { + "provider_model": "anthropic/claude-3-haiku", + "canonical_model": "anthropic/claude-3-haiku" + }, { "provider_model": "anthropic/claude-3.5-haiku", "canonical_model": "openrouter/anthropic/claude-3.5-haiku" }, + { + "provider_model": "anthropic/claude-3.5-sonnet", + "canonical_model": "anthropic/claude-3.5-sonnet" + }, { "provider_model": "anthropic/claude-3.7-sonnet", "canonical_model": "openrouter/anthropic/claude-3.7-sonnet" @@ -4307,6 +4731,10 @@ "provider_model": "anthropic/claude-sonnet-4.5", "canonical_model": "openrouter/anthropic/claude-sonnet-4.5" }, + { + "provider_model": "anthropic/claude-sonnet-4.6", + "canonical_model": "anthropic/claude-sonnet-4.6" + }, { "provider_model": "arcee-ai/trinity-large-preview:free", "canonical_model": "openrouter/arcee-ai/trinity-large-preview:free" @@ -4315,6 +4743,26 @@ "provider_model": "arcee-ai/trinity-mini:free", "canonical_model": "openrouter/arcee-ai/trinity-mini:free" }, + { + "provider_model": "cognitivecomputations/dolphin-mistral-24b-venice-edition:free", + "canonical_model": "openrouter/cognitivecomputations/dolphin-mistral-24b-venice-edition:free" + }, + { + "provider_model": "cohere/command-r-08-2024", + "canonical_model": "cohere/command-r-08" + }, + { + "provider_model": "cohere/command-r-plus-08-2024", + "canonical_model": "cohere/command-r-plus-08" + }, + { + "provider_model": "cohere/command-r7b-12-2024", + "canonical_model": "cohere/command-r7b-12" + }, + { + "provider_model": "deepseek/deepseek-chat", + "canonical_model": "deepseek/deepseek-chat" + }, { "provider_model": "deepseek/deepseek-chat-v3-0324", "canonical_model": "openrouter/deepseek/deepseek-chat-v3" @@ -4323,6 +4771,14 @@ "provider_model": "deepseek/deepseek-chat-v3.1", "canonical_model": "openrouter/deepseek/deepseek-chat-v3.1" }, + { + "provider_model": "deepseek/deepseek-r1-0528:free", + "canonical_model": "openrouter/deepseek/deepseek-r1-0528:free" + }, + { + "provider_model": "deepseek/deepseek-r1-distill-llama-70b", + "canonical_model": "openrouter/deepseek/deepseek-r1-distill-llama-70b" + }, { "provider_model": "deepseek/deepseek-v3.1-terminus", "canonical_model": "openrouter/deepseek/deepseek-v3.1-terminus" @@ -4335,6 +4791,10 @@ "provider_model": "deepseek/deepseek-v3.2", "canonical_model": "openrouter/deepseek/deepseek-v3.2" }, + { + "provider_model": "deepseek/deepseek-v3.2-speciale", + "canonical_model": "openrouter/deepseek/deepseek-v3.2-speciale" + }, { "provider_model": "google/gemini-2.0-flash-001", "canonical_model": "openrouter/google/gemini-2.0-flash-001" @@ -4343,6 +4803,10 @@ "provider_model": "google/gemini-2.5-flash", "canonical_model": "openrouter/google/gemini-2.5-flash" }, + { + "provider_model": "google/gemini-2.5-flash-image", + "canonical_model": "google/gemini-2.5-flash-image" + }, { "provider_model": "google/gemini-2.5-flash-lite", "canonical_model": "openrouter/google/gemini-2.5-flash-lite" @@ -4351,10 +4815,6 @@ "provider_model": "google/gemini-2.5-flash-lite-preview-09-2025", "canonical_model": "openrouter/google/gemini-2.5-flash-lite-preview-09" }, - { - "provider_model": "google/gemini-2.5-flash-preview-09-2025", - "canonical_model": "openrouter/google/gemini-2.5-flash-preview-09" - }, { "provider_model": "google/gemini-2.5-pro", "canonical_model": "openrouter/google/gemini-2.5-pro" @@ -4371,6 +4831,18 @@ "provider_model": "google/gemini-3-pro-preview", "canonical_model": "openrouter/google/gemini-3-pro-preview" }, + { + "provider_model": "google/gemma-2-9b-it", + "canonical_model": "openrouter/google/gemma-2-9b-it" + }, + { + "provider_model": "google/gemma-3-12b-it", + "canonical_model": "openrouter/google/gemma-3-12b-it" + }, + { + "provider_model": "google/gemma-3-12b-it:free", + "canonical_model": "openrouter/google/gemma-3-12b-it:free" + }, { "provider_model": "google/gemma-3-27b-it", "canonical_model": "openrouter/google/gemma-3-27b-it" @@ -4379,10 +4851,54 @@ "provider_model": "google/gemma-3-27b-it:free", "canonical_model": "openrouter/google/gemma-3-27b-it:free" }, + { + "provider_model": "google/gemma-3-4b-it", + "canonical_model": "openrouter/google/gemma-3-4b-it" + }, + { + "provider_model": "google/gemma-3-4b-it:free", + "canonical_model": "openrouter/google/gemma-3-4b-it:free" + }, + { + "provider_model": "google/gemma-3n-e2b-it:free", + "canonical_model": "openrouter/google/gemma-3n-e2b-it:free" + }, + { + "provider_model": "google/gemma-3n-e4b-it", + "canonical_model": "openrouter/google/gemma-3n-e4b-it" + }, + { + "provider_model": "google/gemma-3n-e4b-it:free", + "canonical_model": "openrouter/google/gemma-3n-e4b-it:free" + }, + { + "provider_model": "liquid/lfm-2.5-1.2b-instruct:free", + "canonical_model": "openrouter/liquid/lfm-2.5-1.2b-instruct:free" + }, + { + "provider_model": "liquid/lfm-2.5-1.2b-thinking:free", + "canonical_model": "openrouter/liquid/lfm-2.5-1.2b-thinking:free" + }, + { + "provider_model": "meta-llama/llama-3.2-11b-vision-instruct", + "canonical_model": "openrouter/meta-llama/llama-3.2-11b-vision-instruct" + }, + { + "provider_model": "meta-llama/llama-3.2-3b-instruct:free", + "canonical_model": "openrouter/meta-llama/llama-3.2-3b-instruct:free" + }, + { + "provider_model": "meta-llama/llama-3.3-70b-instruct", + "canonical_model": "meta-llama/llama-3.3-70b-instruct" + }, { "provider_model": "meta-llama/llama-3.3-70b-instruct:free", "canonical_model": "openrouter/meta-llama/llama-3.3-70b-instruct:free" }, + { + "provider_model": "minimax/minimax-01", + "canonical_model": "openrouter/minimax/minimax-01" + }, { "provider_model": "minimax/minimax-m1", "canonical_model": "openrouter/minimax/minimax-m1" @@ -4395,6 +4911,10 @@ "provider_model": "minimax/minimax-m2.1", "canonical_model": "openrouter/minimax/minimax-m2.1" }, + { + "provider_model": "minimax/minimax-m2.5", + "canonical_model": "openrouter/minimax/minimax-m2.5" + }, { "provider_model": "mistralai/codestral-2508", "canonical_model": "openrouter/mistralai/codestral" @@ -4411,6 +4931,30 @@ "provider_model": "mistralai/devstral-small", "canonical_model": "openrouter/mistralai/devstral-small" }, + { + "provider_model": "mistralai/ministral-3b-2512", + "canonical_model": "mistralai/ministral-3b" + }, + { + "provider_model": "mistralai/ministral-8b-2512", + "canonical_model": "mistralai/ministral-8b" + }, + { + "provider_model": "mistralai/mistral-large", + "canonical_model": "mistralai/mistral-large" + }, + { + "provider_model": "mistralai/mistral-large-2407", + "canonical_model": "mistralai/mistral-large" + }, + { + "provider_model": "mistralai/mistral-large-2411", + "canonical_model": "mistralai/mistral-large" + }, + { + "provider_model": "mistralai/mistral-large-2512", + "canonical_model": "mistralai/mistral-large" + }, { "provider_model": "mistralai/mistral-medium-3", "canonical_model": "openrouter/mistralai/mistral-medium-3" @@ -4419,6 +4963,10 @@ "provider_model": "mistralai/mistral-medium-3.1", "canonical_model": "openrouter/mistralai/mistral-medium-3.1" }, + { + "provider_model": "mistralai/mistral-nemo", + "canonical_model": "mistralai/mistral-nemo" + }, { "provider_model": "mistralai/mistral-small-3.1-24b-instruct", "canonical_model": "openrouter/mistralai/mistral-small-3.1-24b-instruct" @@ -4427,6 +4975,10 @@ "provider_model": "mistralai/mistral-small-3.2-24b-instruct", "canonical_model": "openrouter/mistralai/mistral-small-3.2-24b-instruct" }, + { + "provider_model": "mistralai/pixtral-large-2411", + "canonical_model": "mistralai/pixtral-large" + }, { "provider_model": "moonshotai/kimi-k2", "canonical_model": "openrouter/moonshotai/kimi-k2" @@ -4447,6 +4999,14 @@ "provider_model": "moonshotai/kimi-k2.5", "canonical_model": "openrouter/moonshotai/kimi-k2.5" }, + { + "provider_model": "nousresearch/hermes-3-llama-3.1-405b:free", + "canonical_model": "openrouter/nousresearch/hermes-3-llama-3.1-405b:free" + }, + { + "provider_model": "nousresearch/hermes-4-405b", + "canonical_model": "openrouter/nousresearch/hermes-4-405b" + }, { "provider_model": "nousresearch/hermes-4-70b", "canonical_model": "openrouter/nousresearch/hermes-4-70b" @@ -4468,32 +5028,76 @@ "canonical_model": "openrouter/nvidia/nemotron-nano-9b-v2:free" }, { - "provider_model": "openai/gpt-4.1", - "canonical_model": "openrouter/openai/gpt-4.1" + "provider_model": "openai/gpt-3.5-turbo", + "canonical_model": "openai/gpt-3.5-turbo" }, { - "provider_model": "openai/gpt-4.1-mini", - "canonical_model": "openrouter/openai/gpt-4.1-mini" + "provider_model": "openai/gpt-3.5-turbo-0613", + "canonical_model": "openai/gpt-3.5-turbo" }, { - "provider_model": "openai/gpt-4o-mini", - "canonical_model": "openrouter/openai/gpt-4o-mini" + "provider_model": "openai/gpt-4", + "canonical_model": "openai/gpt-4" }, { - "provider_model": "openai/gpt-4o-mini-2024-07-18", - "canonical_model": "openrouter/openai/gpt-4o-mini" + "provider_model": "openai/gpt-4-0314", + "canonical_model": "openai/gpt-4" }, { - "provider_model": "openai/gpt-5", - "canonical_model": "openrouter/openai/gpt-5" + "provider_model": "openai/gpt-4-turbo", + "canonical_model": "openai/gpt-4-turbo" }, { - "provider_model": "openai/gpt-5-codex", - "canonical_model": "openrouter/openai/gpt-5-codex" + "provider_model": "openai/gpt-4.1", + "canonical_model": "openrouter/openai/gpt-4.1" }, { - "provider_model": "openai/gpt-5-image", - "canonical_model": "openrouter/openai/gpt-5-image" + "provider_model": "openai/gpt-4.1-mini", + "canonical_model": "openrouter/openai/gpt-4.1-mini" + }, + { + "provider_model": "openai/gpt-4.1-nano", + "canonical_model": "openai/gpt-4.1-nano" + }, + { + "provider_model": "openai/gpt-4o", + "canonical_model": "openai/gpt-4o" + }, + { + "provider_model": "openai/gpt-4o-2024-05-13", + "canonical_model": "openai/gpt-4o" + }, + { + "provider_model": "openai/gpt-4o-2024-08-06", + "canonical_model": "openai/gpt-4o" + }, + { + "provider_model": "openai/gpt-4o-2024-11-20", + "canonical_model": "openai/gpt-4o" + }, + { + "provider_model": "openai/gpt-4o-mini", + "canonical_model": "openrouter/openai/gpt-4o-mini" + }, + { + "provider_model": "openai/gpt-4o-mini-2024-07-18", + "canonical_model": "openrouter/openai/gpt-4o-mini" + }, + { + "provider_model": "openai/gpt-5", + "canonical_model": "openrouter/openai/gpt-5" + }, + { + "provider_model": "openai/gpt-5-chat", + "canonical_model": "openrouter/openai/gpt-5-chat" + }, + { + "provider_model": "openai/gpt-5-codex", + "canonical_model": "openrouter/openai/gpt-5-codex" + }, + { + "provider_model": "openai/gpt-5-image", + "canonical_model": "openrouter/openai/gpt-5-image" }, { "provider_model": "openai/gpt-5-mini", @@ -4567,10 +5171,50 @@ "provider_model": "openai/gpt-oss-safeguard-20b", "canonical_model": "openrouter/openai/gpt-oss-safeguard-20b" }, + { + "provider_model": "openai/o1", + "canonical_model": "openai/o1" + }, + { + "provider_model": "openai/o1-pro", + "canonical_model": "openai/o1-pro" + }, + { + "provider_model": "openai/o3", + "canonical_model": "openai/o3" + }, + { + "provider_model": "openai/o3-deep-research", + "canonical_model": "openai/o3-deep-research" + }, + { + "provider_model": "openai/o3-mini", + "canonical_model": "openai/o3-mini" + }, + { + "provider_model": "openai/o3-pro", + "canonical_model": "openai/o3-pro" + }, { "provider_model": "openai/o4-mini", "canonical_model": "openrouter/openai/o4-mini" }, + { + "provider_model": "openai/o4-mini-deep-research", + "canonical_model": "openai/o4-mini-deep-research" + }, + { + "provider_model": "prime-intellect/intellect-3", + "canonical_model": "openrouter/prime-intellect/intellect-3" + }, + { + "provider_model": "qwen/qwen-2.5-coder-32b-instruct", + "canonical_model": "openrouter/qwen/qwen-2.5-coder-32b-instruct" + }, + { + "provider_model": "qwen/qwen2.5-vl-72b-instruct", + "canonical_model": "openrouter/qwen/qwen2.5-vl-72b-instruct" + }, { "provider_model": "qwen/qwen3-235b-a22b-thinking-2507", "canonical_model": "openrouter/qwen/qwen3-235b-a22b-thinking" @@ -4624,8 +5268,20 @@ "canonical_model": "openrouter/qwen/qwen3-next-80b-a3b-thinking" }, { - "provider_model": "tngtech/tng-r1t-chimera:free", - "canonical_model": "openrouter/tngtech/tng-r1t-chimera:free" + "provider_model": "qwen/qwen3.5-397b-a17b", + "canonical_model": "openrouter/qwen/qwen3.5-397b-a17b" + }, + { + "provider_model": "qwen/qwen3.5-plus-02-15", + "canonical_model": "openrouter/qwen/qwen3.5-plus-02-15" + }, + { + "provider_model": "stepfun/step-3.5-flash", + "canonical_model": "openrouter/stepfun/step-3.5-flash" + }, + { + "provider_model": "stepfun/step-3.5-flash:free", + "canonical_model": "openrouter/stepfun/step-3.5-flash:free" }, { "provider_model": "x-ai/grok-3", @@ -4694,6 +5350,10 @@ { "provider_model": "z-ai/glm-4.7-flash", "canonical_model": "openrouter/z-ai/glm-4.7-flash" + }, + { + "provider_model": "z-ai/glm-5", + "canonical_model": "openrouter/z-ai/glm-5" } ], "tetrate": [ @@ -4773,6 +5433,10 @@ "provider_model": "claude-sonnet-4-5-20250929", "canonical_model": "anthropic/claude-sonnet-4.5" }, + { + "provider_model": "claude-sonnet-4-6", + "canonical_model": "anthropic/claude-sonnet-4.6" + }, { "provider_model": "deepinfra/anthropic/claude-3-7-sonnet-latest", "canonical_model": "anthropic/claude-3.7-sonnet" @@ -4825,6 +5489,30 @@ "provider_model": "gemini-3-pro-preview", "canonical_model": "google/gemini-3-pro-preview" }, + { + "provider_model": "gemini-embedding-001", + "canonical_model": "google/gemini-embedding-001" + }, + { + "provider_model": "gpt-3.5-turbo", + "canonical_model": "openai/gpt-3.5-turbo" + }, + { + "provider_model": "gpt-3.5-turbo-0125", + "canonical_model": "openai/gpt-3.5-turbo" + }, + { + "provider_model": "gpt-3.5-turbo-1106", + "canonical_model": "openai/gpt-3.5-turbo" + }, + { + "provider_model": "gpt-4", + "canonical_model": "openai/gpt-4" + }, + { + "provider_model": "gpt-4-0613", + "canonical_model": "openai/gpt-4" + }, { "provider_model": "gpt-4-turbo", "canonical_model": "openai/gpt-4-turbo" @@ -5087,18 +5775,6 @@ ] }, "mapped_models": [ - { - "provider": "anthropic", - "model": "claude-3-5-haiku-20241022", - "canonical": "anthropic/claude-3.5-haiku", - "recommended": true - }, - { - "provider": "anthropic", - "model": "claude-3-7-sonnet-20250219", - "canonical": "anthropic/claude-3.7-sonnet", - "recommended": true - }, { "provider": "anthropic", "model": "claude-3-haiku-20240307", @@ -5147,6 +5823,12 @@ "canonical": "anthropic/claude-sonnet-4.5", "recommended": true }, + { + "provider": "anthropic", + "model": "claude-sonnet-4-6", + "canonical": "anthropic/claude-sonnet-4.6", + "recommended": true + }, { "provider": "databricks", "model": "claude-3-5-haiku", @@ -5225,6 +5907,12 @@ "canonical": "anthropic/claude-sonnet-4.5", "recommended": true }, + { + "provider": "databricks", + "model": "databricks-claude-sonnet-4-6", + "canonical": "anthropic/claude-sonnet-4.6", + "recommended": true + }, { "provider": "databricks", "model": "databricks-gemini-2-5-flash", @@ -5439,13 +6127,13 @@ "provider": "databricks", "model": "gpt-3-5-turbo", "canonical": "openai/gpt-3.5-turbo", - "recommended": true + "recommended": false }, { "provider": "databricks", "model": "gpt-3-5-turbo-0125", "canonical": "openai/gpt-3.5-turbo", - "recommended": true + "recommended": false }, { "provider": "databricks", @@ -5561,6 +6249,12 @@ "canonical": "anthropic/claude-haiku-4.5", "recommended": true }, + { + "provider": "databricks", + "model": "kgoose-claude-opus-4-6", + "canonical": "anthropic/claude-opus-4.6", + "recommended": true + }, { "provider": "databricks", "model": "kgoose-claude-sonnet-4-5", @@ -5685,13 +6379,13 @@ "provider": "databricks", "model": "o1-mini", "canonical": "openai/o1-mini", - "recommended": true + "recommended": false }, { "provider": "databricks", "model": "o1-preview", "canonical": "openai/o1-preview", - "recommended": true + "recommended": false }, { "provider": "databricks", @@ -5739,7 +6433,7 @@ "provider": "google", "model": "gemini-2.5-flash-image", "canonical": "google/gemini-2.5-flash-image", - "recommended": true + "recommended": false }, { "provider": "google", @@ -5753,17 +6447,11 @@ "canonical": "google/gemini-2.5-flash-lite-preview-09", "recommended": true }, - { - "provider": "google", - "model": "gemini-2.5-flash-preview-09-2025", - "canonical": "google/gemini-2.5-flash-preview-09", - "recommended": true - }, { "provider": "google", "model": "gemini-2.5-flash-preview-tts", "canonical": "google/gemini-2.5-flash-preview-tts", - "recommended": true + "recommended": false }, { "provider": "google", @@ -5775,7 +6463,7 @@ "provider": "google", "model": "gemini-2.5-pro-preview-tts", "canonical": "google/gemini-2.5-pro-preview-tts", - "recommended": true + "recommended": false }, { "provider": "google", @@ -5793,7 +6481,7 @@ "provider": "google", "model": "gemini-embedding-001", "canonical": "google/gemini-embedding-001", - "recommended": true + "recommended": false }, { "provider": "google", @@ -5811,19 +6499,19 @@ "provider": "openai", "model": "gpt-3.5-turbo", "canonical": "openai/gpt-3.5-turbo", - "recommended": true + "recommended": false }, { "provider": "openai", "model": "gpt-3.5-turbo-0125", "canonical": "openai/gpt-3.5-turbo", - "recommended": true + "recommended": false }, { "provider": "openai", "model": "gpt-3.5-turbo-1106", "canonical": "openai/gpt-3.5-turbo", - "recommended": true + "recommended": false }, { "provider": "openai", @@ -5943,7 +6631,7 @@ "provider": "openai", "model": "gpt-5-chat-latest", "canonical": "openai/gpt-5-chat", - "recommended": true + "recommended": false }, { "provider": "openai", @@ -6159,18 +6847,24 @@ "provider": "openai", "model": "text-embedding-3-large", "canonical": "openai/text-embedding-3-large", - "recommended": true + "recommended": false }, { "provider": "openai", "model": "text-embedding-3-small", "canonical": "openai/text-embedding-3-small", - "recommended": true + "recommended": false }, { "provider": "openai", "model": "text-embedding-ada-002", "canonical": "openai/text-embedding-ada-002", + "recommended": false + }, + { + "provider": "openrouter", + "model": "anthropic/claude-3-haiku", + "canonical": "anthropic/claude-3-haiku", "recommended": true }, { @@ -6179,6 +6873,12 @@ "canonical": "openrouter/anthropic/claude-3.5-haiku", "recommended": true }, + { + "provider": "openrouter", + "model": "anthropic/claude-3.5-sonnet", + "canonical": "anthropic/claude-3.5-sonnet", + "recommended": true + }, { "provider": "openrouter", "model": "anthropic/claude-3.7-sonnet", @@ -6227,6 +6927,12 @@ "canonical": "openrouter/anthropic/claude-sonnet-4.5", "recommended": true }, + { + "provider": "openrouter", + "model": "anthropic/claude-sonnet-4.6", + "canonical": "anthropic/claude-sonnet-4.6", + "recommended": true + }, { "provider": "openrouter", "model": "arcee-ai/trinity-large-preview:free", @@ -6239,11 +6945,41 @@ "canonical": "openrouter/arcee-ai/trinity-mini:free", "recommended": true }, + { + "provider": "openrouter", + "model": "cognitivecomputations/dolphin-mistral-24b-venice-edition:free", + "canonical": "openrouter/cognitivecomputations/dolphin-mistral-24b-venice-edition:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "cohere/command-r-08-2024", + "canonical": "cohere/command-r-08", + "recommended": true + }, + { + "provider": "openrouter", + "model": "cohere/command-r-plus-08-2024", + "canonical": "cohere/command-r-plus-08", + "recommended": true + }, + { + "provider": "openrouter", + "model": "cohere/command-r7b-12-2024", + "canonical": "cohere/command-r7b-12", + "recommended": true + }, + { + "provider": "openrouter", + "model": "deepseek/deepseek-chat", + "canonical": "deepseek/deepseek-chat", + "recommended": true + }, { "provider": "openrouter", "model": "deepseek/deepseek-chat-v3-0324", "canonical": "openrouter/deepseek/deepseek-chat-v3", - "recommended": true + "recommended": false }, { "provider": "openrouter", @@ -6251,6 +6987,18 @@ "canonical": "openrouter/deepseek/deepseek-chat-v3.1", "recommended": true }, + { + "provider": "openrouter", + "model": "deepseek/deepseek-r1-0528:free", + "canonical": "openrouter/deepseek/deepseek-r1-0528:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "deepseek/deepseek-r1-distill-llama-70b", + "canonical": "openrouter/deepseek/deepseek-r1-distill-llama-70b", + "recommended": false + }, { "provider": "openrouter", "model": "deepseek/deepseek-v3.1-terminus", @@ -6269,6 +7017,12 @@ "canonical": "openrouter/deepseek/deepseek-v3.2", "recommended": true }, + { + "provider": "openrouter", + "model": "deepseek/deepseek-v3.2-speciale", + "canonical": "openrouter/deepseek/deepseek-v3.2-speciale", + "recommended": true + }, { "provider": "openrouter", "model": "google/gemini-2.0-flash-001", @@ -6281,6 +7035,12 @@ "canonical": "openrouter/google/gemini-2.5-flash", "recommended": true }, + { + "provider": "openrouter", + "model": "google/gemini-2.5-flash-image", + "canonical": "google/gemini-2.5-flash-image", + "recommended": false + }, { "provider": "openrouter", "model": "google/gemini-2.5-flash-lite", @@ -6293,12 +7053,6 @@ "canonical": "openrouter/google/gemini-2.5-flash-lite-preview-09", "recommended": true }, - { - "provider": "openrouter", - "model": "google/gemini-2.5-flash-preview-09-2025", - "canonical": "openrouter/google/gemini-2.5-flash-preview-09", - "recommended": true - }, { "provider": "openrouter", "model": "google/gemini-2.5-pro", @@ -6323,6 +7077,24 @@ "canonical": "openrouter/google/gemini-3-pro-preview", "recommended": true }, + { + "provider": "openrouter", + "model": "google/gemma-2-9b-it", + "canonical": "openrouter/google/gemma-2-9b-it", + "recommended": false + }, + { + "provider": "openrouter", + "model": "google/gemma-3-12b-it", + "canonical": "openrouter/google/gemma-3-12b-it", + "recommended": false + }, + { + "provider": "openrouter", + "model": "google/gemma-3-12b-it:free", + "canonical": "openrouter/google/gemma-3-12b-it:free", + "recommended": false + }, { "provider": "openrouter", "model": "google/gemma-3-27b-it", @@ -6335,12 +7107,78 @@ "canonical": "openrouter/google/gemma-3-27b-it:free", "recommended": true }, + { + "provider": "openrouter", + "model": "google/gemma-3-4b-it", + "canonical": "openrouter/google/gemma-3-4b-it", + "recommended": false + }, + { + "provider": "openrouter", + "model": "google/gemma-3-4b-it:free", + "canonical": "openrouter/google/gemma-3-4b-it:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "google/gemma-3n-e2b-it:free", + "canonical": "openrouter/google/gemma-3n-e2b-it:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "google/gemma-3n-e4b-it", + "canonical": "openrouter/google/gemma-3n-e4b-it", + "recommended": false + }, + { + "provider": "openrouter", + "model": "google/gemma-3n-e4b-it:free", + "canonical": "openrouter/google/gemma-3n-e4b-it:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "liquid/lfm-2.5-1.2b-instruct:free", + "canonical": "openrouter/liquid/lfm-2.5-1.2b-instruct:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "liquid/lfm-2.5-1.2b-thinking:free", + "canonical": "openrouter/liquid/lfm-2.5-1.2b-thinking:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "meta-llama/llama-3.2-11b-vision-instruct", + "canonical": "openrouter/meta-llama/llama-3.2-11b-vision-instruct", + "recommended": false + }, + { + "provider": "openrouter", + "model": "meta-llama/llama-3.2-3b-instruct:free", + "canonical": "openrouter/meta-llama/llama-3.2-3b-instruct:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "meta-llama/llama-3.3-70b-instruct", + "canonical": "meta-llama/llama-3.3-70b-instruct", + "recommended": true + }, { "provider": "openrouter", "model": "meta-llama/llama-3.3-70b-instruct:free", "canonical": "openrouter/meta-llama/llama-3.3-70b-instruct:free", "recommended": true }, + { + "provider": "openrouter", + "model": "minimax/minimax-01", + "canonical": "openrouter/minimax/minimax-01", + "recommended": true + }, { "provider": "openrouter", "model": "minimax/minimax-m1", @@ -6359,6 +7197,12 @@ "canonical": "openrouter/minimax/minimax-m2.1", "recommended": true }, + { + "provider": "openrouter", + "model": "minimax/minimax-m2.5", + "canonical": "openrouter/minimax/minimax-m2.5", + "recommended": true + }, { "provider": "openrouter", "model": "mistralai/codestral-2508", @@ -6383,6 +7227,42 @@ "canonical": "openrouter/mistralai/devstral-small", "recommended": true }, + { + "provider": "openrouter", + "model": "mistralai/ministral-3b-2512", + "canonical": "mistralai/ministral-3b", + "recommended": true + }, + { + "provider": "openrouter", + "model": "mistralai/ministral-8b-2512", + "canonical": "mistralai/ministral-8b", + "recommended": true + }, + { + "provider": "openrouter", + "model": "mistralai/mistral-large", + "canonical": "mistralai/mistral-large", + "recommended": true + }, + { + "provider": "openrouter", + "model": "mistralai/mistral-large-2407", + "canonical": "mistralai/mistral-large", + "recommended": true + }, + { + "provider": "openrouter", + "model": "mistralai/mistral-large-2411", + "canonical": "mistralai/mistral-large", + "recommended": true + }, + { + "provider": "openrouter", + "model": "mistralai/mistral-large-2512", + "canonical": "mistralai/mistral-large", + "recommended": true + }, { "provider": "openrouter", "model": "mistralai/mistral-medium-3", @@ -6395,6 +7275,12 @@ "canonical": "openrouter/mistralai/mistral-medium-3.1", "recommended": true }, + { + "provider": "openrouter", + "model": "mistralai/mistral-nemo", + "canonical": "mistralai/mistral-nemo", + "recommended": true + }, { "provider": "openrouter", "model": "mistralai/mistral-small-3.1-24b-instruct", @@ -6407,6 +7293,12 @@ "canonical": "openrouter/mistralai/mistral-small-3.2-24b-instruct", "recommended": true }, + { + "provider": "openrouter", + "model": "mistralai/pixtral-large-2411", + "canonical": "mistralai/pixtral-large", + "recommended": true + }, { "provider": "openrouter", "model": "moonshotai/kimi-k2", @@ -6437,6 +7329,18 @@ "canonical": "openrouter/moonshotai/kimi-k2.5", "recommended": true }, + { + "provider": "openrouter", + "model": "nousresearch/hermes-3-llama-3.1-405b:free", + "canonical": "openrouter/nousresearch/hermes-3-llama-3.1-405b:free", + "recommended": false + }, + { + "provider": "openrouter", + "model": "nousresearch/hermes-4-405b", + "canonical": "openrouter/nousresearch/hermes-4-405b", + "recommended": true + }, { "provider": "openrouter", "model": "nousresearch/hermes-4-70b", @@ -6467,6 +7371,36 @@ "canonical": "openrouter/nvidia/nemotron-nano-9b-v2:free", "recommended": true }, + { + "provider": "openrouter", + "model": "openai/gpt-3.5-turbo", + "canonical": "openai/gpt-3.5-turbo", + "recommended": false + }, + { + "provider": "openrouter", + "model": "openai/gpt-3.5-turbo-0613", + "canonical": "openai/gpt-3.5-turbo", + "recommended": false + }, + { + "provider": "openrouter", + "model": "openai/gpt-4", + "canonical": "openai/gpt-4", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/gpt-4-0314", + "canonical": "openai/gpt-4", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/gpt-4-turbo", + "canonical": "openai/gpt-4-turbo", + "recommended": true + }, { "provider": "openrouter", "model": "openai/gpt-4.1", @@ -6479,6 +7413,36 @@ "canonical": "openrouter/openai/gpt-4.1-mini", "recommended": true }, + { + "provider": "openrouter", + "model": "openai/gpt-4.1-nano", + "canonical": "openai/gpt-4.1-nano", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/gpt-4o", + "canonical": "openai/gpt-4o", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/gpt-4o-2024-05-13", + "canonical": "openai/gpt-4o", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/gpt-4o-2024-08-06", + "canonical": "openai/gpt-4o", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/gpt-4o-2024-11-20", + "canonical": "openai/gpt-4o", + "recommended": true + }, { "provider": "openrouter", "model": "openai/gpt-4o-mini", @@ -6497,6 +7461,12 @@ "canonical": "openrouter/openai/gpt-5", "recommended": true }, + { + "provider": "openrouter", + "model": "openai/gpt-5-chat", + "canonical": "openrouter/openai/gpt-5-chat", + "recommended": false + }, { "provider": "openrouter", "model": "openai/gpt-5-codex", @@ -6617,12 +7587,72 @@ "canonical": "openrouter/openai/gpt-oss-safeguard-20b", "recommended": true }, + { + "provider": "openrouter", + "model": "openai/o1", + "canonical": "openai/o1", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/o1-pro", + "canonical": "openai/o1-pro", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/o3", + "canonical": "openai/o3", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/o3-deep-research", + "canonical": "openai/o3-deep-research", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/o3-mini", + "canonical": "openai/o3-mini", + "recommended": true + }, + { + "provider": "openrouter", + "model": "openai/o3-pro", + "canonical": "openai/o3-pro", + "recommended": true + }, { "provider": "openrouter", "model": "openai/o4-mini", "canonical": "openrouter/openai/o4-mini", "recommended": true }, + { + "provider": "openrouter", + "model": "openai/o4-mini-deep-research", + "canonical": "openai/o4-mini-deep-research", + "recommended": true + }, + { + "provider": "openrouter", + "model": "prime-intellect/intellect-3", + "canonical": "openrouter/prime-intellect/intellect-3", + "recommended": true + }, + { + "provider": "openrouter", + "model": "qwen/qwen-2.5-coder-32b-instruct", + "canonical": "openrouter/qwen/qwen-2.5-coder-32b-instruct", + "recommended": false + }, + { + "provider": "openrouter", + "model": "qwen/qwen2.5-vl-72b-instruct", + "canonical": "openrouter/qwen/qwen2.5-vl-72b-instruct", + "recommended": false + }, { "provider": "openrouter", "model": "qwen/qwen3-235b-a22b-thinking-2507", @@ -6703,8 +7733,26 @@ }, { "provider": "openrouter", - "model": "tngtech/tng-r1t-chimera:free", - "canonical": "openrouter/tngtech/tng-r1t-chimera:free", + "model": "qwen/qwen3.5-397b-a17b", + "canonical": "openrouter/qwen/qwen3.5-397b-a17b", + "recommended": true + }, + { + "provider": "openrouter", + "model": "qwen/qwen3.5-plus-02-15", + "canonical": "openrouter/qwen/qwen3.5-plus-02-15", + "recommended": true + }, + { + "provider": "openrouter", + "model": "stepfun/step-3.5-flash", + "canonical": "openrouter/stepfun/step-3.5-flash", + "recommended": true + }, + { + "provider": "openrouter", + "model": "stepfun/step-3.5-flash:free", + "canonical": "openrouter/stepfun/step-3.5-flash:free", "recommended": true }, { @@ -6777,7 +7825,7 @@ "provider": "openrouter", "model": "z-ai/glm-4.5-air:free", "canonical": "openrouter/z-ai/glm-4.5-air:free", - "recommended": true + "recommended": false }, { "provider": "openrouter", @@ -6809,6 +7857,12 @@ "canonical": "openrouter/z-ai/glm-4.7-flash", "recommended": true }, + { + "provider": "openrouter", + "model": "z-ai/glm-5", + "canonical": "openrouter/z-ai/glm-5", + "recommended": true + }, { "provider": "tetrate", "model": "claude-3-5-haiku-20241022", @@ -6923,6 +7977,12 @@ "canonical": "anthropic/claude-sonnet-4.5", "recommended": true }, + { + "provider": "tetrate", + "model": "claude-sonnet-4-6", + "canonical": "anthropic/claude-sonnet-4.6", + "recommended": true + }, { "provider": "tetrate", "model": "deepinfra/anthropic/claude-3-7-sonnet-latest", @@ -7001,6 +8061,42 @@ "canonical": "google/gemini-3-pro-preview", "recommended": true }, + { + "provider": "tetrate", + "model": "gemini-embedding-001", + "canonical": "google/gemini-embedding-001", + "recommended": false + }, + { + "provider": "tetrate", + "model": "gpt-3.5-turbo", + "canonical": "openai/gpt-3.5-turbo", + "recommended": false + }, + { + "provider": "tetrate", + "model": "gpt-3.5-turbo-0125", + "canonical": "openai/gpt-3.5-turbo", + "recommended": false + }, + { + "provider": "tetrate", + "model": "gpt-3.5-turbo-1106", + "canonical": "openai/gpt-3.5-turbo", + "recommended": false + }, + { + "provider": "tetrate", + "model": "gpt-4", + "canonical": "openai/gpt-4", + "recommended": true + }, + { + "provider": "tetrate", + "model": "gpt-4-0613", + "canonical": "openai/gpt-4", + "recommended": true + }, { "provider": "tetrate", "model": "gpt-4-turbo", @@ -7101,7 +8197,7 @@ "provider": "tetrate", "model": "gpt-5-chat-latest", "canonical": "openai/gpt-5-chat", - "recommended": true + "recommended": false }, { "provider": "tetrate", @@ -7387,15 +8483,15 @@ } ], "model_counts": { - "anthropic": 12, + "anthropic": 11, "aws_bedrock": 0, "azure_openai": 0, - "databricks": 163, + "databricks": 168, "gcp_vertex_ai": 0, - "google": 45, - "openai": 652, - "openrouter": 230, - "tetrate": 151, + "google": 43, + "openai": 659, + "openrouter": 337, + "tetrate": 207, "venice": 0, "xai": 13 }, @@ -7414,6 +8510,11 @@ "anthropic/claude-sonnet-4", "anthropic/claude-sonnet-4.0", "anthropic/claude-sonnet-4.5", + "anthropic/claude-sonnet-4.6", + "cohere/command-r-08", + "cohere/command-r-plus-08", + "cohere/command-r7b-12", + "deepseek/deepseek-chat", "google/gemini-1.5-flash", "google/gemini-1.5-pro", "google/gemini-2.0-flash", @@ -7432,6 +8533,11 @@ "google/gemini-flash", "google/gemini-flash-lite", "meta-llama/llama-3.3-70b-instruct", + "mistralai/ministral-3b", + "mistralai/ministral-8b", + "mistralai/mistral-large", + "mistralai/mistral-nemo", + "mistralai/pixtral-large", "openai/gpt-3.5-turbo", "openai/gpt-4", "openai/gpt-4-turbo", @@ -7479,26 +8585,43 @@ "openrouter/anthropic/claude-sonnet-4.5", "openrouter/arcee-ai/trinity-large-preview:free", "openrouter/arcee-ai/trinity-mini:free", + "openrouter/cognitivecomputations/dolphin-mistral-24b-venice-edition:free", "openrouter/deepseek/deepseek-chat-v3", "openrouter/deepseek/deepseek-chat-v3.1", + "openrouter/deepseek/deepseek-r1-0528:free", + "openrouter/deepseek/deepseek-r1-distill-llama-70b", "openrouter/deepseek/deepseek-v3.1-terminus", "openrouter/deepseek/deepseek-v3.1-terminus:exacto", "openrouter/deepseek/deepseek-v3.2", + "openrouter/deepseek/deepseek-v3.2-speciale", "openrouter/google/gemini-2.0-flash-001", "openrouter/google/gemini-2.5-flash", "openrouter/google/gemini-2.5-flash-lite", "openrouter/google/gemini-2.5-flash-lite-preview-09", - "openrouter/google/gemini-2.5-flash-preview-09", "openrouter/google/gemini-2.5-pro", "openrouter/google/gemini-2.5-pro-preview-05-06", "openrouter/google/gemini-3-flash-preview", "openrouter/google/gemini-3-pro-preview", + "openrouter/google/gemma-2-9b-it", + "openrouter/google/gemma-3-12b-it", + "openrouter/google/gemma-3-12b-it:free", "openrouter/google/gemma-3-27b-it", "openrouter/google/gemma-3-27b-it:free", + "openrouter/google/gemma-3-4b-it", + "openrouter/google/gemma-3-4b-it:free", + "openrouter/google/gemma-3n-e2b-it:free", + "openrouter/google/gemma-3n-e4b-it", + "openrouter/google/gemma-3n-e4b-it:free", + "openrouter/liquid/lfm-2.5-1.2b-instruct:free", + "openrouter/liquid/lfm-2.5-1.2b-thinking:free", + "openrouter/meta-llama/llama-3.2-11b-vision-instruct", + "openrouter/meta-llama/llama-3.2-3b-instruct:free", "openrouter/meta-llama/llama-3.3-70b-instruct:free", + "openrouter/minimax/minimax-01", "openrouter/minimax/minimax-m1", "openrouter/minimax/minimax-m2", "openrouter/minimax/minimax-m2.1", + "openrouter/minimax/minimax-m2.5", "openrouter/mistralai/codestral", "openrouter/mistralai/devstral", "openrouter/mistralai/devstral-medium", @@ -7511,6 +8634,8 @@ "openrouter/moonshotai/kimi-k2-0905:exacto", "openrouter/moonshotai/kimi-k2-thinking", "openrouter/moonshotai/kimi-k2.5", + "openrouter/nousresearch/hermes-3-llama-3.1-405b:free", + "openrouter/nousresearch/hermes-4-405b", "openrouter/nousresearch/hermes-4-70b", "openrouter/nvidia/nemotron-3-nano-30b-a3b:free", "openrouter/nvidia/nemotron-nano-12b-v2-vl:free", @@ -7520,6 +8645,7 @@ "openrouter/openai/gpt-4.1-mini", "openrouter/openai/gpt-4o-mini", "openrouter/openai/gpt-5", + "openrouter/openai/gpt-5-chat", "openrouter/openai/gpt-5-codex", "openrouter/openai/gpt-5-image", "openrouter/openai/gpt-5-mini", @@ -7541,6 +8667,9 @@ "openrouter/openai/gpt-oss-20b:free", "openrouter/openai/gpt-oss-safeguard-20b", "openrouter/openai/o4-mini", + "openrouter/prime-intellect/intellect-3", + "openrouter/qwen/qwen-2.5-coder-32b-instruct", + "openrouter/qwen/qwen2.5-vl-72b-instruct", "openrouter/qwen/qwen3-235b-a22b-thinking", "openrouter/qwen/qwen3-30b-a3b-instruct", "openrouter/qwen/qwen3-30b-a3b-thinking", @@ -7554,7 +8683,10 @@ "openrouter/qwen/qwen3-next-80b-a3b-instruct", "openrouter/qwen/qwen3-next-80b-a3b-instruct:free", "openrouter/qwen/qwen3-next-80b-a3b-thinking", - "openrouter/tngtech/tng-r1t-chimera:free", + "openrouter/qwen/qwen3.5-397b-a17b", + "openrouter/qwen/qwen3.5-plus-02-15", + "openrouter/stepfun/step-3.5-flash", + "openrouter/stepfun/step-3.5-flash:free", "openrouter/x-ai/grok-3", "openrouter/x-ai/grok-3-beta", "openrouter/x-ai/grok-3-mini", @@ -7572,6 +8704,7 @@ "openrouter/z-ai/glm-4.6:exacto", "openrouter/z-ai/glm-4.7", "openrouter/z-ai/glm-4.7-flash", + "openrouter/z-ai/glm-5", "x-ai/grok-2-vision", "x-ai/grok-3", "x-ai/grok-3-fast", diff --git a/crates/goose/src/providers/canonical/data/canonical_models.json b/crates/goose/src/providers/canonical/data/canonical_models.json index 0d2320e51728..4d46e28f22ee 100644 --- a/crates/goose/src/providers/canonical/data/canonical_models.json +++ b/crates/goose/src/providers/canonical/data/canonical_models.json @@ -1,15 +1,14 @@ [ { - "id": "amazon-bedrock/ai21.jamba-1.5-large-v1:0", - "name": "Jamba 1.5 Large", - "family": "jamba", + "id": "302ai/MiniMax-M1", + "name": "MiniMax-M1", + "family": "minimax", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "modalities": { "input": [ "text" @@ -18,27 +17,25 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.0, - "output": 8.0 + "input": 0.132, + "output": 1.254 }, "limit": { - "context": 256000, - "output": 4096 + "context": 1000000, + "output": 128000 } }, { - "id": "amazon-bedrock/ai21.jamba-1.5-mini-v1:0", - "name": "Jamba 1.5 Mini", - "family": "jamba", + "id": "302ai/MiniMax-M2", + "name": "MiniMax-M2", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-10-26", + "last_updated": "2025-10-26", "modalities": { "input": [ "text" @@ -47,31 +44,28 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.33, + "output": 1.32 }, "limit": { - "context": 256000, - "output": 4096 + "context": 1000000, + "output": 128000 } }, { - "id": "amazon-bedrock/amazon.nova-2-lite-v1:0", - "name": "Nova 2 Lite", - "family": "nova", + "id": "302ai/MiniMax-M2.1", + "name": "MiniMax-M2.1", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -79,60 +73,29 @@ }, "open_weights": false, "cost": { - "input": 0.33, - "output": 2.75 + "input": 0.3, + "output": 1.2 }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 131072 } }, { - "id": "amazon-bedrock/amazon.nova-lite-v1:0", - "name": "Nova Lite", - "family": "nova-lite", + "id": "302ai/chatgpt-4o", + "name": "chatgpt-4o-latest", + "family": "gpt", "attachment": true, "reasoning": false, - "tool_call": true, + "tool_call": false, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2023-09", + "release_date": "2024-08-08", + "last_updated": "2024-08-08", "modalities": { "input": [ "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, - "open_weights": false, - "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 - }, - "limit": { - "context": 300000, - "output": 8192 - } - }, - { - "id": "amazon-bedrock/amazon.nova-micro-v1:0", - "name": "Nova Micro", - "family": "nova-micro", - "attachment": false, - "reasoning": false, - "tool_call": true, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "modalities": { - "input": [ - "text" + "image" ], "output": [ "text" @@ -140,31 +103,28 @@ }, "open_weights": false, "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 + "input": 5.0, + "output": 15.0 }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 } }, { - "id": "amazon-bedrock/amazon.nova-premier-v1:0", - "name": "Nova Premier", - "family": "nova", + "id": "302ai/claude-haiku-4.5", + "name": "claude-haiku-4-5-20251001", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2025-03", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -172,30 +132,28 @@ }, "open_weights": false, "cost": { - "input": 2.5, - "output": 12.5 + "input": 1.0, + "output": 5.0 }, "limit": { - "context": 1000000, - "output": 16384 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/amazon.nova-pro-v1:0", - "name": "Nova Pro", - "family": "nova-pro", + "id": "302ai/claude-opus-4.1", + "name": "claude-opus-4-1-20250805", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2025-03", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -203,28 +161,28 @@ }, "open_weights": false, "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 15.0, + "output": 75.0 }, "limit": { - "context": 300000, - "output": 8192 + "context": 200000, + "output": 32000 } }, { - "id": "amazon-bedrock/amazon.titan-text-express-v1", - "name": "Titan Text G1 - Express", - "family": "titan", - "attachment": false, - "reasoning": false, + "id": "302ai/claude-opus-4.1-20250805-thinking", + "name": "claude-opus-4-1-20250805-thinking", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-03", + "release_date": "2025-05-27", + "last_updated": "2025-05-27", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -232,27 +190,28 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.6 + "input": 15.0, + "output": 75.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 } }, { - "id": "amazon-bedrock/amazon.titan-text-express-v1:0:8k", - "name": "Titan Text G1 - Express", - "family": "titan", - "attachment": false, + "id": "302ai/claude-opus-4.5", + "name": "claude-opus-4-5-20251101", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -260,30 +219,28 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.6 + "input": 5.0, + "output": 25.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/anthropic.claude-3-haiku-20240307-v1:0", - "name": "Claude Haiku 3", - "family": "claude-haiku", + "id": "302ai/claude-opus-4.5-20251101-thinking", + "name": "claude-opus-4-5-20251101-thinking", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-02", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -291,30 +248,28 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 1.25 + "input": 5.0, + "output": 25.0 }, "limit": { "context": 200000, - "output": 4096 + "output": 64000 } }, { - "id": "amazon-bedrock/anthropic.claude-3-opus-20240229-v1:0", - "name": "Claude Opus 3", - "family": "claude-opus", + "id": "302ai/claude-sonnet-4.5", + "name": "claude-sonnet-4-5-20250929", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2025-03", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -322,30 +277,28 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0 + "input": 3.0, + "output": 15.0 }, "limit": { "context": 200000, - "output": 4096 + "output": 64000 } }, { - "id": "amazon-bedrock/anthropic.claude-3-sonnet-20240229-v1:0", - "name": "Claude Sonnet 3", - "family": "claude-sonnet", + "id": "302ai/claude-sonnet-4.5-20250929-thinking", + "name": "claude-sonnet-4-5-20250929-thinking", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -358,25 +311,23 @@ }, "limit": { "context": 200000, - "output": 4096 + "output": 64000 } }, { - "id": "amazon-bedrock/anthropic.claude-3.5-haiku-20241022-v1:0", - "name": "Claude Haiku 3.5", - "family": "claude-haiku", - "attachment": true, + "id": "302ai/deepseek-chat", + "name": "Deepseek-Chat", + "family": "deepseek", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2024-07", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -384,32 +335,28 @@ }, "open_weights": false, "cost": { - "input": 0.8, - "output": 4.0, - "cache_read": 0.08, - "cache_write": 1.0 + "input": 0.29, + "output": 0.43 }, "limit": { - "context": 200000, + "context": 128000, "output": 8192 } }, { - "id": "amazon-bedrock/anthropic.claude-3.5-sonnet-20240620-v1:0", - "name": "Claude Sonnet 3.5", - "family": "claude-sonnet", - "attachment": true, - "reasoning": false, + "id": "302ai/deepseek-reasoner", + "name": "Deepseek-Reasoner", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -417,32 +364,27 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.29, + "output": 0.43 }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 } }, { - "id": "amazon-bedrock/anthropic.claude-3.5-sonnet-20241022-v2:0", - "name": "Claude Sonnet 3.5 v2", - "family": "claude-sonnet", - "attachment": true, + "id": "302ai/deepseek-v3.2", + "name": "deepseek-v3.2", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -450,32 +392,27 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.29, + "output": 0.43 }, "limit": { - "context": 200000, + "context": 128000, "output": 8192 } }, { - "id": "amazon-bedrock/anthropic.claude-3.7-sonnet-20250219-v1:0", - "name": "Claude Sonnet 3.7", - "family": "claude-sonnet", - "attachment": true, - "reasoning": false, + "id": "302ai/deepseek-v3.2-thinking", + "name": "DeepSeek-V3.2-Thinking", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -483,32 +420,27 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.29, + "output": 0.43 }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 } }, { - "id": "amazon-bedrock/anthropic.claude-haiku-4.5-20251001-v1:0", - "name": "Claude Haiku 4.5", - "family": "claude-haiku", + "id": "302ai/doubao-seed-1.6-thinking-250715", + "name": "doubao-seed-1-6-thinking-250715", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -516,30 +448,27 @@ }, "open_weights": false, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.121, + "output": 1.21 }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 16000 } }, { - "id": "amazon-bedrock/anthropic.claude-instant-v1", - "name": "Claude Instant", - "family": "claude", - "attachment": false, + "id": "302ai/doubao-seed-1.6-vision-250815", + "name": "doubao-seed-1-6-vision-250815", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -547,30 +476,27 @@ }, "open_weights": false, "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.114, + "output": 1.143 }, "limit": { - "context": 100000, - "output": 4096 + "context": 256000, + "output": 32000 } }, { - "id": "amazon-bedrock/anthropic.claude-opus-4-20250514-v1:0", - "name": "Claude Opus 4", - "family": "claude-opus", + "id": "302ai/doubao-seed-1.8-251215", + "name": "doubao-seed-1-8-251215", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -578,32 +504,27 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.114, + "output": 0.286 }, "limit": { - "context": 200000, - "output": 32000 + "context": 224000, + "output": 64000 } }, { - "id": "amazon-bedrock/anthropic.claude-opus-4.1-20250805-v1:0", - "name": "Claude Opus 4.1", - "family": "claude-opus", + "id": "302ai/doubao-seed-code-preview-251028", + "name": "doubao-seed-code-preview-251028", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -611,32 +532,29 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.17, + "output": 1.14 }, "limit": { - "context": 200000, + "context": 256000, "output": 32000 } }, { - "id": "amazon-bedrock/anthropic.claude-opus-4.5-20251101-v1:0", - "name": "Claude Opus 4.5", - "family": "claude-opus", + "id": "302ai/gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "family": "gemini-flash-lite", "attachment": true, - "reasoning": true, - "tool_call": true, + "reasoning": false, + "tool_call": false, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2024-11", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -644,32 +562,29 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.075, + "output": 0.3 }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 8192 } }, { - "id": "amazon-bedrock/anthropic.claude-opus-4.6-v1", - "name": "Claude Opus 4.6", - "family": "claude-opus", + "id": "302ai/gemini-2.5-flash", + "name": "gemini-2.5-flash", + "family": "gemini-flash", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -677,32 +592,28 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 2.5 }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 } }, { - "id": "amazon-bedrock/anthropic.claude-sonnet-4-20250514-v1:0", - "name": "Claude Sonnet 4", - "family": "claude-sonnet", + "id": "302ai/gemini-2.5-flash-image", + "name": "gemini-2.5-flash-image", "attachment": true, - "reasoning": true, - "tool_call": true, + "reasoning": false, + "tool_call": false, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -710,32 +621,28 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 30.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32768 } }, { - "id": "amazon-bedrock/anthropic.claude-sonnet-4.5-20250929-v1:0", - "name": "Claude Sonnet 4.5", - "family": "claude-sonnet", + "id": "302ai/gemini-2.5-flash-lite-preview-09", + "name": "gemini-2.5-flash-lite-preview-09-2025", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -743,30 +650,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.1, + "output": 0.4 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 } }, { - "id": "amazon-bedrock/anthropic.claude-v2", - "name": "Claude 2", - "family": "claude", - "attachment": false, + "id": "302ai/gemini-2.5-flash-nothink", + "name": "gemini-2.5-flash-nothink", + "family": "gemini-flash", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2023-07-11", - "last_updated": "2023-07-11", + "knowledge": "2025-01", + "release_date": "2025-06-24", + "last_updated": "2025-06-24", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -774,28 +680,28 @@ }, "open_weights": false, "cost": { - "input": 8.0, - "output": 24.0 + "input": 0.3, + "output": 2.5 }, "limit": { - "context": 100000, - "output": 4096 + "context": 1000000, + "output": 65536 } }, { - "id": "amazon-bedrock/anthropic.claude-v2:1", - "name": "Claude 2.1", - "family": "claude", - "attachment": false, + "id": "302ai/gemini-2.5-flash-preview-09", + "name": "gemini-2.5-flash-preview-09-2025", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2023-11-21", - "last_updated": "2023-11-21", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -803,112 +709,141 @@ }, "open_weights": false, "cost": { - "input": 8.0, - "output": 24.0 + "input": 0.3, + "output": 2.5 }, "limit": { - "context": 200000, - "output": 4096 + "context": 1000000, + "output": 65536 } }, { - "id": "amazon-bedrock/cohere.command-light-text-v14", - "name": "Command Light", - "family": "command-light", - "attachment": false, + "id": "302ai/gemini-2.5-pro", + "name": "gemini-2.5-pro", + "family": "gemini-pro", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2023-11-01", - "last_updated": "2023-11-01", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 0.6 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 4096, - "output": 4096 + "context": 1000000, + "output": 65536 } }, { - "id": "amazon-bedrock/cohere.command-r-plus-v1:0", - "name": "Command R+", - "family": "command-r", - "attachment": false, + "id": "302ai/gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2024-04-04", - "last_updated": "2024-04-04", + "knowledge": "2025-06", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0 + }, + "limit": { + "context": 1000000, + "output": 65536 + } + }, + { + "id": "302ai/gemini-3-pro-image-preview", + "name": "gemini-3-pro-image-preview", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0 + "input": 2.0, + "output": 120.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 64000 } }, { - "id": "amazon-bedrock/cohere.command-r-v1:0", - "name": "Command R", - "family": "command-r", - "attachment": false, + "id": "302ai/gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2024-03-11", - "last_updated": "2024-03-11", + "knowledge": "2025-06", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.5, - "output": 1.5 + "input": 2.0, + "output": 12.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 } }, { - "id": "amazon-bedrock/cohere.command-text-v14", - "name": "Command", - "family": "command", + "id": "302ai/glm-4.5", + "name": "GLM-4.5", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-08", - "release_date": "2023-11-01", - "last_updated": "2023-11-01", + "knowledge": "2024-10", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "modalities": { "input": [ "text" @@ -917,30 +852,30 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 1.5, - "output": 2.0 + "input": 0.286, + "output": 1.142 }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 98304 } }, { - "id": "amazon-bedrock/deepseek.r1-v1:0", - "name": "DeepSeek-R1", - "family": "deepseek-thinking", - "attachment": false, - "reasoning": true, + "id": "302ai/glm-4.5v", + "name": "GLM-4.5V", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "knowledge": "2024-10", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -948,25 +883,24 @@ }, "open_weights": false, "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.29, + "output": 0.86 }, "limit": { - "context": 128000, - "output": 32768 + "context": 64000, + "output": 16384 } }, { - "id": "amazon-bedrock/deepseek.v3-v1:0", - "name": "DeepSeek-V3.1", - "family": "deepseek", + "id": "302ai/glm-4.6", + "name": "glm-4.6", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ "text" @@ -975,32 +909,30 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.286, + "output": 1.142 }, "limit": { - "context": 163840, - "output": 81920 + "context": 200000, + "output": 131072 } }, { - "id": "amazon-bedrock/eu.anthropic.claude-haiku-4.5-20251001-v1:0", - "name": "Claude Haiku 4.5 (EU)", - "family": "claude-haiku", + "id": "302ai/glm-4.6v", + "name": "GLM-4.6V", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-03", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1008,32 +940,27 @@ }, "open_weights": false, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.145, + "output": 0.43 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 } }, { - "id": "amazon-bedrock/eu.anthropic.claude-opus-4.5-20251101-v1:0", - "name": "Claude Opus 4.5 (EU)", - "family": "claude-opus", - "attachment": true, - "reasoning": true, + "id": "302ai/glm-4.7", + "name": "glm-4.7", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2025-06", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -1041,32 +968,29 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.286, + "output": 1.142 }, "limit": { "context": 200000, - "output": 64000 + "output": 131072 } }, { - "id": "amazon-bedrock/eu.anthropic.claude-opus-4.6-v1", - "name": "Claude Opus 4.6 (EU)", - "family": "claude-opus", + "id": "302ai/gpt-4.1", + "name": "gpt-4.1", + "family": "gpt", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1074,32 +998,29 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2.0, + "output": 8.0 }, "limit": { "context": 1000000, - "output": 128000 + "output": 32768 } }, { - "id": "amazon-bedrock/eu.anthropic.claude-sonnet-4-20250514-v1:0", - "name": "Claude Sonnet 4 (EU)", - "family": "claude-sonnet", + "id": "302ai/gpt-4.1-mini", + "name": "gpt-4.1-mini", + "family": "gpt-mini", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1107,32 +1028,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.4, + "output": 1.6 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 } }, { - "id": "amazon-bedrock/eu.anthropic.claude-sonnet-4.5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (EU)", - "family": "claude-sonnet", + "id": "302ai/gpt-4.1-nano", + "name": "gpt-4.1-nano", + "family": "gpt-nano", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1140,32 +1058,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.1, + "output": 0.4 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 } }, { - "id": "amazon-bedrock/global.anthropic.claude-haiku-4.5-20251001-v1:0", - "name": "Claude Haiku 4.5 (Global)", - "family": "claude-haiku", + "id": "302ai/gpt-4o", + "name": "gpt-4o", + "family": "gpt", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1173,32 +1088,28 @@ }, "open_weights": false, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 2.5, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 } }, { - "id": "amazon-bedrock/global.anthropic.claude-opus-4.5-20251101-v1:0", - "name": "Claude Opus 4.5 (Global)", - "family": "claude-opus", + "id": "302ai/gpt-5", + "name": "gpt-5", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1206,32 +1117,28 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 } }, { - "id": "amazon-bedrock/global.anthropic.claude-opus-4.6-v1", - "name": "Claude Opus 4.6 (Global)", - "family": "claude-opus", + "id": "302ai/gpt-5-mini", + "name": "gpt-5-mini", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1239,32 +1146,28 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.25, + "output": 2.0 }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 } }, { - "id": "amazon-bedrock/global.anthropic.claude-sonnet-4-20250514-v1:0", - "name": "Claude Sonnet 4 (Global)", - "family": "claude-sonnet", + "id": "302ai/gpt-5-pro", + "name": "gpt-5-pro", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1272,32 +1175,28 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 15.0, + "output": 120.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 272000 } }, { - "id": "amazon-bedrock/global.anthropic.claude-sonnet-4.5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (Global)", - "family": "claude-sonnet", + "id": "302ai/gpt-5-thinking", + "name": "gpt-5-thinking", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1305,27 +1204,24 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 } }, { - "id": "amazon-bedrock/google.gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "family": "gemma", - "attachment": false, + "id": "302ai/gpt-5.1", + "name": "gpt-5.1", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-10", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "modalities": { "input": [ "text", @@ -1337,25 +1233,24 @@ }, "open_weights": false, "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "amazon-bedrock/google.gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "family": "gemma", + "id": "302ai/gpt-5.1-chat", + "name": "gpt-5.1-chat-latest", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "knowledge": "2024-10", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "modalities": { "input": [ "text", @@ -1365,26 +1260,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.12, - "output": 0.2 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 202752, - "output": 8192 + "context": 128000, + "output": 16384 } }, { - "id": "amazon-bedrock/google.gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "family": "gemma", - "attachment": false, + "id": "302ai/gpt-5.2", + "name": "gpt-5.2", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-10", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "modalities": { "input": [ "text", @@ -1396,83 +1291,82 @@ }, "open_weights": false, "cost": { - "input": 0.04, - "output": 0.08 + "input": 1.75, + "output": 14.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 } }, { - "id": "amazon-bedrock/meta.llama3-1-70b-instruct-v1:0", - "name": "Llama 3.1 70B Instruct", - "family": "llama", - "attachment": false, + "id": "302ai/gpt-5.2-chat", + "name": "gpt-5.2-chat-latest", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-10", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.72, - "output": 0.72 + "input": 1.75, + "output": 14.0 }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 } }, { - "id": "amazon-bedrock/meta.llama3-1-8b-instruct-v1:0", - "name": "Llama 3.1 8B Instruct", - "family": "llama", - "attachment": false, - "reasoning": false, + "id": "302ai/grok-4-fast", + "name": "grok-4-fast-reasoning", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.2, + "output": 0.5 }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 30000 } }, { - "id": "amazon-bedrock/meta.llama3-2-11b-instruct-v1:0", - "name": "Llama 3.2 11B Instruct", - "family": "llama", + "id": "302ai/grok-4-fast-non", + "name": "grok-4-fast-non-reasoning", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ "text", @@ -1482,85 +1376,84 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.2, + "output": 0.5 }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 30000 } }, { - "id": "amazon-bedrock/meta.llama3-2-1b-instruct-v1:0", - "name": "Llama 3.2 1B Instruct", - "family": "llama", - "attachment": false, + "id": "302ai/grok-4.1", + "name": "grok-4.1", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.0, + "output": 10.0 }, "limit": { - "context": 131000, - "output": 4096 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/meta.llama3-2-3b-instruct-v1:0", - "name": "Llama 3.2 3B Instruct", - "family": "llama", - "attachment": false, - "reasoning": false, + "id": "302ai/grok-4.1-fast", + "name": "grok-4-1-fast-reasoning", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.2, + "output": 0.5 }, "limit": { - "context": 131000, - "output": 4096 + "context": 2000000, + "output": 30000 } }, { - "id": "amazon-bedrock/meta.llama3-2-90b-instruct-v1:0", - "name": "Llama 3.2 90B Instruct", - "family": "llama", + "id": "302ai/grok-4.1-fast-non", + "name": "grok-4-1-fast-non-reasoning", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "modalities": { "input": [ "text", @@ -1570,27 +1463,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.2, + "output": 0.5 }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 30000 } }, { - "id": "amazon-bedrock/meta.llama3-3-70b-instruct-v1:0", - "name": "Llama 3.3 70B Instruct", - "family": "llama", + "id": "302ai/kimi-k2-0905-preview", + "name": "kimi-k2-0905-preview", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -1599,27 +1491,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.632, + "output": 2.53 }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 } }, { - "id": "amazon-bedrock/meta.llama3-70b-instruct-v1:0", - "name": "Llama 3 70B Instruct", - "family": "llama", + "id": "302ai/kimi-k2-thinking", + "name": "kimi-k2-thinking", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -1628,27 +1519,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.65, - "output": 3.5 + "input": 0.575, + "output": 2.3 }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 262144 } }, { - "id": "amazon-bedrock/meta.llama3-8b-instruct-v1:0", - "name": "Llama 3 8B Instruct", - "family": "llama", + "id": "302ai/kimi-k2-thinking-turbo", + "name": "kimi-k2-thinking-turbo", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-03", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -1657,27 +1547,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 0.6 + "input": 1.265, + "output": 9.119 }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 262144 } }, { - "id": "amazon-bedrock/meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct", - "family": "llama", + "id": "302ai/ministral-14b", + "name": "ministral-14b-2512", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "modalities": { "input": [ "text", @@ -1687,27 +1576,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.24, - "output": 0.97 + "input": 0.33, + "output": 0.33 }, "limit": { - "context": 1000000, - "output": 16384 + "context": 128000, + "output": 128000 } }, { - "id": "amazon-bedrock/meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct", - "family": "llama", + "id": "302ai/mistral-large", + "name": "mistral-large-2512", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "modalities": { "input": [ "text", @@ -1717,26 +1605,25 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.17, - "output": 0.66 + "input": 1.1, + "output": 3.3 }, "limit": { - "context": 3500000, - "output": 16384 + "context": 128000, + "output": 262144 } }, { - "id": "amazon-bedrock/minimax.minimax-m2", - "name": "MiniMax M2", - "family": "minimax", + "id": "302ai/qwen-flash", + "name": "Qwen-Flash", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -1745,26 +1632,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.022, + "output": 0.22 }, "limit": { - "context": 204608, - "output": 128000 + "context": 1000000, + "output": 32768 } }, { - "id": "amazon-bedrock/minimax.minimax-m2.1", - "name": "MiniMax M2.1", - "family": "minimax", + "id": "302ai/qwen-max", + "name": "Qwen-Max-Latest", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-11", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "modalities": { "input": [ "text" @@ -1773,26 +1661,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.343, + "output": 1.372 }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 } }, { - "id": "amazon-bedrock/mistral.ministral-3-14b-instruct", - "name": "Ministral 14B 3.0", - "family": "ministral", + "id": "302ai/qwen-plus", + "name": "Qwen-Plus", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-10", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "modalities": { "input": [ "text" @@ -1803,24 +1692,25 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.12, + "output": 1.2 }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 } }, { - "id": "amazon-bedrock/mistral.ministral-3-8b-instruct", - "name": "Ministral 3 8B", - "family": "ministral", + "id": "302ai/qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "modalities": { "input": [ "text" @@ -1831,24 +1721,24 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.29, + "output": 2.86 }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 } }, { - "id": "amazon-bedrock/mistral.mistral-7b-instruct-v0:2", - "name": "Mistral-7B-Instruct-v0.3", - "family": "mistral", + "id": "302ai/qwen3-235b-a22b-instruct", + "name": "qwen3-235b-a22b-instruct-2507", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "modalities": { "input": [ "text" @@ -1857,26 +1747,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.29, + "output": 1.143 }, "limit": { - "context": 127000, - "output": 127000 + "context": 128000, + "output": 65536 } }, { - "id": "amazon-bedrock/mistral.mistral-large-2402-v1:0", - "name": "Mistral Large (24.02)", - "family": "mistral-large", + "id": "302ai/qwen3-30b-a3b", + "name": "Qwen3-30B-A3B", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "modalities": { "input": [ "text" @@ -1887,24 +1778,24 @@ }, "open_weights": false, "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.11, + "output": 1.08 }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 } }, { - "id": "amazon-bedrock/mistral.mixtral-8x7b-instruct-v0:1", - "name": "Mixtral-8x7B-Instruct-v0.1", - "family": "mixtral", + "id": "302ai/qwen3-coder-480b-a35b-instruct", + "name": "qwen3-coder-480b-a35b-instruct", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "modalities": { "input": [ "text" @@ -1913,29 +1804,28 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.86, + "output": 3.43 }, "limit": { - "context": 32000, - "output": 32000 + "context": 262144, + "output": 65536 } }, { - "id": "amazon-bedrock/mistral.voxtral-mini-3b", - "name": "Voxtral Mini 3B 2507", - "family": "mistral", + "id": "302ai/qwen3-max", + "name": "qwen3-max-2025-09-23", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "modalities": { "input": [ - "audio", "text" ], "output": [ @@ -1944,28 +1834,27 @@ }, "open_weights": false, "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.86, + "output": 3.43 }, "limit": { - "context": 128000, - "output": 4096 + "context": 258048, + "output": 65536 } }, { - "id": "amazon-bedrock/mistral.voxtral-small-24b", - "name": "Voxtral Small 24B 2507", - "family": "mistral", - "attachment": true, - "reasoning": false, + "id": "abacus/Qwen/QwQ-32B", + "name": "QwQ 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ "text" @@ -1973,23 +1862,24 @@ }, "open_weights": true, "cost": { - "input": 0.15, - "output": 0.35 + "input": 0.4, + "output": 0.4 }, "limit": { - "context": 32000, - "output": 8192 + "context": 32768, + "output": 32768 } }, { - "id": "amazon-bedrock/moonshot.kimi-k2-thinking", - "name": "Kimi K2 Thinking", + "id": "abacus/Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen 2.5 72B Instruct", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "modalities": { "input": [ "text" @@ -2000,27 +1890,27 @@ }, "open_weights": true, "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.11, + "output": 0.38 }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 8192 } }, { - "id": "amazon-bedrock/moonshotai.kimi-k2.5", - "name": "Kimi K2.5", + "id": "abacus/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen3 235B A22B Instruct", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -2028,53 +1918,52 @@ }, "open_weights": true, "cost": { - "input": 0.6, - "output": 3.0 + "input": 0.13, + "output": 0.6 }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 8192 } }, { - "id": "amazon-bedrock/nvidia.nemotron-nano-12b-v2", - "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", - "family": "nemotron", + "id": "abacus/Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.09, + "output": 0.29 }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 } }, { - "id": "amazon-bedrock/nvidia.nemotron-nano-9b-v2", - "name": "NVIDIA Nemotron Nano 9B v2", - "family": "nemotron", + "id": "abacus/Qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "modalities": { "input": [ "text" @@ -2083,29 +1972,32 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.06, - "output": 0.23 + "input": 0.29, + "output": 1.2 }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 } }, { - "id": "amazon-bedrock/openai.gpt-oss-120b-1:0", - "name": "gpt-oss-120b", - "family": "gpt-oss", - "attachment": false, - "reasoning": false, + "id": "abacus/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -2113,27 +2005,30 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/openai.gpt-oss-20b-1:0", - "name": "gpt-oss-20b", - "family": "gpt-oss", - "attachment": false, - "reasoning": false, + "id": "abacus/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -2141,27 +2036,29 @@ }, "open_weights": false, "cost": { - "input": 0.07, - "output": 0.3 + "input": 1.0, + "output": 5.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/openai.gpt-oss-safeguard-120b", - "name": "GPT OSS Safeguard 120B", - "family": "gpt-oss", - "attachment": false, - "reasoning": false, + "id": "abacus/claude-opus-4", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -2169,27 +2066,29 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 15.0, + "output": 75.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 } }, { - "id": "amazon-bedrock/openai.gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "family": "gpt-oss", - "attachment": false, - "reasoning": false, + "id": "abacus/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -2197,86 +2096,91 @@ }, "open_weights": false, "cost": { - "input": 0.07, - "output": 0.2 + "input": 15.0, + "output": 75.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 } }, { - "id": "amazon-bedrock/qwen.qwen3-235b-a22b-2507-v1:0", - "name": "Qwen3 235B A22B 2507", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "abacus/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.22, - "output": 0.88 + "input": 5.0, + "output": 25.0 }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/qwen.qwen3-32b-v1:0", - "name": "Qwen3 32B (dense)", - "family": "qwen", - "attachment": false, + "id": "abacus/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/qwen.qwen3-coder-30b-a3b-v1:0", - "name": "Qwen3 Coder 30B A3B Instruct", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "abacus/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -2284,25 +2188,24 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 64000 } }, { - "id": "amazon-bedrock/qwen.qwen3-coder-480b-a35b-v1:0", - "name": "Qwen3 Coder 480B A35B Instruct", - "family": "qwen", + "id": "abacus/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "family": "deepseek-thinking", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "modalities": { "input": [ "text" @@ -2313,24 +2216,24 @@ }, "open_weights": true, "cost": { - "input": 0.22, - "output": 1.8 + "input": 3.0, + "output": 7.0 }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 8192 } }, { - "id": "amazon-bedrock/qwen.qwen3-next-80b-a3b", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "family": "qwen", + "id": "abacus/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "family": "deepseek", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "modalities": { "input": [ "text" @@ -2339,94 +2242,88 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.27, + "output": 1.0 }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 8192 } }, { - "id": "amazon-bedrock/qwen.qwen3-vl-235b-a22b", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "family": "qwen", - "attachment": true, - "reasoning": false, + "id": "abacus/deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.27, + "output": 0.4 }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 8192 } }, { - "id": "amazon-bedrock/us.anthropic.claude-haiku-4.5-20251001-v1:0", - "name": "Claude Haiku 4.5 (US)", - "family": "claude-haiku", - "attachment": true, + "id": "abacus/deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.14, + "output": 0.28 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 } }, { - "id": "amazon-bedrock/us.anthropic.claude-opus-4-20250514-v1:0", - "name": "Claude Opus 4 (US)", - "family": "claude-opus", + "id": "abacus/gemini-2.0-flash-001", + "name": "Gemini 2.0 Flash", + "family": "gemini-flash", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ "text" @@ -2434,64 +2331,59 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.1, + "output": 0.4 }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 8192 } }, { - "id": "amazon-bedrock/us.anthropic.claude-opus-4.1-20250805-v1:0", - "name": "Claude Opus 4.1 (US)", - "family": "claude-opus", + "id": "abacus/gemini-2.0-pro-exp-02-05", + "name": "Gemini 2.0 Pro Exp", + "family": "gemini-pro", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ "text" ] }, "open_weights": false, - "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 - }, + "cost": {}, "limit": { - "context": 200000, - "output": 32000 + "context": 2000000, + "output": 8192 } }, { - "id": "amazon-bedrock/us.anthropic.claude-opus-4.5-20251101-v1:0", - "name": "Claude Opus 4.5 (US)", - "family": "claude-opus", + "id": "abacus/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -2500,31 +2392,31 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 2.5 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 } }, { - "id": "amazon-bedrock/us.anthropic.claude-opus-4.6-v1", - "name": "Claude Opus 4.6 (US)", - "family": "claude-opus", + "id": "abacus/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -2533,31 +2425,31 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 } }, { - "id": "amazon-bedrock/us.anthropic.claude-sonnet-4-20250514-v1:0", - "name": "Claude Sonnet 4 (US)", - "family": "claude-sonnet", + "id": "abacus/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -2566,32 +2458,30 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.5, + "output": 3.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 } }, { - "id": "amazon-bedrock/us.anthropic.claude-sonnet-4.5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (US)", - "family": "claude-sonnet", + "id": "abacus/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ "text" @@ -2599,29 +2489,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2.0, + "output": 12.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65000 } }, { - "id": "amazon-bedrock/writer.palmyra-x4-v1:0", - "name": "Palmyra X4", - "family": "palmyra", - "attachment": false, - "reasoning": true, + "id": "abacus/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -2629,27 +2519,29 @@ }, "open_weights": false, "cost": { - "input": 2.5, - "output": 10.0 + "input": 2.0, + "output": 8.0 }, "limit": { - "context": 122880, - "output": 8192 + "context": 1047576, + "output": 32768 } }, { - "id": "amazon-bedrock/writer.palmyra-x5-v1:0", - "name": "Palmyra X5", - "family": "palmyra", - "attachment": false, - "reasoning": true, + "id": "abacus/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "family": "gpt", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -2657,88 +2549,90 @@ }, "open_weights": false, "cost": { - "input": 0.6, - "output": 6.0 + "input": 0.4, + "output": 1.6 }, "limit": { - "context": 1040000, - "output": 8192 + "context": 1047576, + "output": 32768 } }, { - "id": "amazon-bedrock/zai.glm-4.7", - "name": "GLM-4.7", - "family": "glm", - "attachment": false, - "reasoning": true, + "id": "abacus/gpt-4.1-nano", + "name": "GPT-4.1 Nano", + "family": "gpt", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.1, + "output": 0.4 }, "limit": { - "context": 204800, - "output": 131072 + "context": 1047576, + "output": 32768 } }, { - "id": "amazon-bedrock/zai.glm-4.7-flash", - "name": "GLM-4.7-Flash", - "family": "glm-flash", - "attachment": false, - "reasoning": true, + "id": "abacus/gpt-4o", + "name": "GPT-4o (2024-11-20)", + "family": "gpt", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2024-10", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.07, - "output": 0.4 + "input": 2.5, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 16384 } }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "family": "claude-haiku", + "id": "abacus/gpt-4o-mini", + "name": "GPT-4o Mini", + "family": "gpt", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2024-04", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2746,32 +2640,29 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.15, + "output": 0.6 }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 } }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "family": "claude-opus", + "id": "abacus/gpt-5", + "name": "GPT-5", + "family": "gpt", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2779,32 +2670,29 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 4096 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-3-sonnet", - "name": "Claude Sonnet 3", - "family": "claude-sonnet", + "id": "abacus/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2812,32 +2700,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0.25, + "output": 2.0 }, "limit": { - "context": 200000, - "output": 4096 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - "family": "claude-haiku", + "id": "abacus/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2845,32 +2730,29 @@ }, "open_weights": false, "cost": { - "input": 0.8, - "output": 4.0, - "cache_read": 0.08, - "cache_write": 1.0 + "input": 0.05, + "output": 0.4 }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5", - "family": "claude-sonnet", + "id": "abacus/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2878,32 +2760,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Claude Sonnet 3.7", - "family": "claude-sonnet", + "id": "abacus/gpt-5.1-chat", + "name": "GPT-5.1 Chat Latest", + "family": "gpt", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2911,32 +2790,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.25, + "output": 10.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5 (latest)", - "family": "claude-haiku", + "id": "abacus/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2944,32 +2820,29 @@ }, "open_weights": false, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 1.75, + "output": 14.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "family": "claude-opus", + "id": "abacus/gpt-5.2-chat", + "name": "GPT-5.2 Chat Latest", + "family": "gpt", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -2977,32 +2850,28 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.5, + "output": 12.0 }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 } }, { - "id": "anthropic/claude-opus-4.0", - "name": "Claude Opus 4 (latest)", - "family": "claude-opus", + "id": "abacus/grok-4", + "name": "Grok 4", + "family": "grok", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3010,32 +2879,28 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 16384 } }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "family": "claude-opus", + "id": "abacus/grok-4-fast-non", + "name": "Grok 4 Fast (Non-Reasoning)", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3043,32 +2908,28 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.2, + "output": 0.5 }, "limit": { - "context": 200000, - "output": 32000 + "context": 2000000, + "output": 16384 } }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5 (latest)", - "family": "claude-opus", + "id": "abacus/grok-4.1-fast-non", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3076,32 +2937,28 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.2, + "output": 0.5 }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 16384 } }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude Opus 4.6", - "family": "claude-opus", + "id": "abacus/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3109,32 +2966,27 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.2, + "output": 1.5 }, "limit": { - "context": 200000, - "output": 128000 + "context": 256000, + "output": 16384 } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "family": "claude-sonnet", - "attachment": true, - "reasoning": true, + "id": "abacus/kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo Preview", + "family": "kimi", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -3142,197 +2994,171 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 8.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 } }, { - "id": "anthropic/claude-sonnet-4.0", - "name": "Claude Sonnet 4 (latest)", - "family": "claude-sonnet", - "attachment": true, - "reasoning": true, + "id": "abacus/llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "family": "llama", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.59, + "output": 0.79 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 } }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5 (latest)", - "family": "claude-sonnet", + "id": "abacus/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "family": "llama", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.14, + "output": 0.59 }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 } }, { - "id": "azure/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "family": "claude-haiku", - "attachment": true, - "reasoning": true, + "id": "abacus/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", + "name": "Llama 3.1 405B Instruct Turbo", + "family": "llama", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 3.5, + "output": 3.5 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 } }, { - "id": "azure/claude-opus-4.1", - "name": "Claude Opus 4.1", - "family": "claude-opus", - "attachment": true, - "reasoning": true, + "id": "abacus/meta-llama/Meta-Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.4, + "output": 0.4 }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 4096 } }, { - "id": "azure/claude-opus-4.5", - "name": "Claude Opus 4.5", - "family": "claude-opus", - "attachment": true, - "reasoning": true, + "id": "abacus/meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.02, + "output": 0.05 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 } }, { - "id": "azure/claude-opus-4.6", - "name": "Claude Opus 4.6", - "family": "claude-opus", + "id": "abacus/o3", + "name": "o3", + "family": "o", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3340,32 +3166,28 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2.0, + "output": 8.0 }, "limit": { "context": 200000, - "output": 128000 + "output": 100000 } }, { - "id": "azure/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "family": "claude-sonnet", - "attachment": true, + "id": "abacus/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": false, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -3373,30 +3195,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.1, + "output": 4.4 }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 } }, { - "id": "azure/codestral", - "name": "Codestral 25.01", - "family": "codestral", - "attachment": false, - "reasoning": false, + "id": "abacus/o3-pro", + "name": "o3-pro", + "family": "o-pro", + "attachment": true, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -3404,28 +3225,29 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 0.9 + "input": 20.0, + "output": 80.0 }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 } }, { - "id": "azure/codex-mini", - "name": "Codex Mini", - "family": "gpt-codex-mini", + "id": "abacus/o4-mini", + "name": "o4-mini", + "family": "o-mini", "attachment": true, "reasoning": true, "tool_call": true, "temperature": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -3433,9 +3255,8 @@ }, "open_weights": false, "cost": { - "input": 1.5, - "output": 6.0, - "cache_read": 0.375 + "input": 1.1, + "output": 4.4 }, "limit": { "context": 200000, @@ -3443,19 +3264,19 @@ } }, { - "id": "azure/cohere-command-a", - "name": "Command A", - "family": "command-a", - "attachment": false, + "id": "abacus/openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "family": "gpt-oss", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -3463,25 +3284,24 @@ }, "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0 + "input": 0.08, + "output": 0.44 }, "limit": { - "context": 256000, - "output": 8000 + "context": 128000, + "output": 32768 } }, { - "id": "azure/cohere-command-r-08", - "name": "Command R", - "family": "command-r", + "id": "abacus/qwen-2.5-coder-32b", + "name": "Qwen 2.5 Coder 32B", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "modalities": { "input": [ "text" @@ -3492,25 +3312,24 @@ }, "open_weights": true, "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.79, + "output": 0.79 }, "limit": { "context": 128000, - "output": 4000 + "output": 8192 } }, { - "id": "azure/cohere-command-r-plus-08", - "name": "Command R+", - "family": "command-r", + "id": "abacus/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "modalities": { "input": [ "text" @@ -3519,26 +3338,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.5, - "output": 10.0 + "input": 1.2, + "output": 6.0 }, "limit": { - "context": 128000, - "output": 4000 + "context": 131072, + "output": 16384 } }, { - "id": "azure/cohere-embed-v-4.0", - "name": "Embed v4", - "family": "cohere-embed", + "id": "abacus/route-llm", + "name": "Route LLM", + "family": "gpt", "attachment": true, "reasoning": false, - "tool_call": false, - "temperature": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "modalities": { "input": [ "text", @@ -3548,26 +3368,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.12, - "output": 0.0 + "input": 0.5, + "output": 1.5 }, "limit": { "context": 128000, - "output": 1536 + "output": 16384 } }, { - "id": "azure/cohere-embed-v3-english", - "name": "Embed v3 English", - "family": "cohere-embed", + "id": "abacus/zai-org/glm-4.5", + "name": "GLM-4.5", + "family": "glm", "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": false, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -3578,24 +3398,24 @@ }, "open_weights": true, "cost": { - "input": 0.1, - "output": 0.0 + "input": 0.6, + "output": 2.2 }, "limit": { - "context": 512, - "output": 1024 + "context": 128000, + "output": 8192 } }, { - "id": "azure/cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "family": "cohere-embed", + "id": "abacus/zai-org/glm-4.6", + "name": "GLM-4.6", + "family": "glm", "attachment": false, "reasoning": false, - "tool_call": false, - "temperature": false, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "tool_call": true, + "temperature": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "modalities": { "input": [ "text" @@ -3606,25 +3426,24 @@ }, "open_weights": true, "cost": { - "input": 0.1, - "output": 0.0 + "input": 0.6, + "output": 2.2 }, "limit": { - "context": 512, - "output": 1024 + "context": 128000, + "output": 8192 } }, { - "id": "azure/deepseek-r1", - "name": "DeepSeek-R1", - "family": "deepseek-thinking", + "id": "abacus/zai-org/glm-4.7", + "name": "GLM-4.7", + "family": "glm", "attachment": false, - "reasoning": true, - "tool_call": false, + "reasoning": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "modalities": { "input": [ "text" @@ -3635,25 +3454,25 @@ }, "open_weights": true, "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.7, + "output": 2.5 }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 8192 } }, { - "id": "azure/deepseek-v3", - "name": "DeepSeek-V3-0324", - "family": "deepseek", + "id": "aihubmix/Kimi-K2", + "name": "Kimi K2 0905", + "family": "kimi", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -3664,115 +3483,127 @@ }, "open_weights": true, "cost": { - "input": 1.14, - "output": 4.56 + "input": 0.55, + "output": 2.19 }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 } }, { - "id": "azure/deepseek-v3.1", - "name": "DeepSeek-V3.1", - "family": "deepseek", - "attachment": false, + "id": "aihubmix/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.56, - "output": 1.68 + "input": 1.1, + "output": 5.5, + "cache_read": 0.11, + "cache_write": 1.25 }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 } }, { - "id": "azure/deepseek-v3.2", - "name": "DeepSeek-V3.2", - "family": "deepseek", - "attachment": false, + "id": "aihubmix/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.58, - "output": 1.68 + "input": 16.5, + "output": 82.5, + "cache_read": 1.5, + "cache_write": 18.75 }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 32000 } }, { - "id": "azure/deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "family": "deepseek", - "attachment": false, + "id": "aihubmix/claude-opus-4.5", + "name": "Claude Opus 4.5", + "attachment": true, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.58, - "output": 1.68 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 32000 } }, { - "id": "azure/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo 1106", - "family": "gpt", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "aihubmix/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -3780,28 +3611,32 @@ }, "open_weights": false, "cost": { - "input": 1.0, - "output": 2.0 + "input": 5.0, + "output": 25.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 128000 } }, { - "id": "azure/gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "family": "gpt", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "aihubmix/claude-opus-4.6-think", + "name": "Claude Opus 4.6 Think", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -3809,28 +3644,32 @@ }, "open_weights": false, "cost": { - "input": 1.5, - "output": 2.0 + "input": 5.0, + "output": 25.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 128000 } }, { - "id": "azure/gpt-4", - "name": "GPT-4", - "family": "gpt", - "attachment": false, - "reasoning": false, + "id": "aihubmix/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -3838,28 +3677,32 @@ }, "open_weights": false, "cost": { - "input": 60.0, - "output": 120.0 + "input": 3.3, + "output": 16.5, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 64000 } }, { - "id": "azure/gpt-4-32k", - "name": "GPT-4 32K", - "family": "gpt", - "attachment": false, - "reasoning": false, + "id": "aihubmix/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -3867,29 +3710,32 @@ }, "open_weights": false, "cost": { - "input": 60.0, - "output": 120.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 64000 } }, { - "id": "azure/gpt-4-turbo", - "name": "GPT-4 Turbo", - "family": "gpt", + "id": "aihubmix/claude-sonnet-4.6-think", + "name": "Claude Sonnet 4.6 Think", + "family": "claude-sonnet", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -3897,214 +3743,208 @@ }, "open_weights": false, "cost": { - "input": 10.0, - "output": 30.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 } }, { - "id": "azure/gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "family": "gpt", - "attachment": true, - "reasoning": false, + "id": "aihubmix/coding-glm-4.7", + "name": "Coding-GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 10.0, - "output": 30.0 + "input": 0.27, + "output": 1.1, + "cache_read": 0.548 }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 } }, { - "id": "azure/gpt-4.1", - "name": "GPT-4.1", - "family": "gpt", - "attachment": true, - "reasoning": false, + "id": "aihubmix/coding-glm-4.7-free", + "name": "Coding GLM 4.7 Free", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 8.0, - "cache_read": 0.5 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 204800, + "output": 131072 } }, { - "id": "azure/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "family": "gpt-mini", - "attachment": true, - "reasoning": false, + "id": "aihubmix/coding-minimax-m2.1-free", + "name": "Coding MiniMax M2.1 Free", + "family": "minimax", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 204800, + "output": 131072 } }, { - "id": "azure/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "family": "gpt-nano", - "attachment": true, - "reasoning": false, + "id": "aihubmix/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0.3, + "output": 0.45 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131000, + "output": 64000 } }, { - "id": "azure/gpt-4o", - "name": "GPT-4o", - "family": "gpt", - "attachment": true, + "id": "aihubmix/deepseek-v3.2-fast", + "name": "DeepSeek-V3.2-Fast", + "family": "deepseek", + "attachment": false, "reasoning": false, - "tool_call": true, - "temperature": true, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "tool_call": false, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0, - "cache_read": 1.25 + "input": 1.1, + "output": 3.29 }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 } }, { - "id": "azure/gpt-4o-mini", - "name": "GPT-4o mini", - "family": "gpt-mini", - "attachment": true, - "reasoning": false, + "id": "aihubmix/deepseek-v3.2-think", + "name": "DeepSeek-V3.2-Think", + "family": "deepseek", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.3, + "output": 0.45 }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 64000 } }, { - "id": "azure/gpt-5", - "name": "GPT-5", - "family": "gpt", + "id": "aihubmix/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" @@ -4112,30 +3952,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.13 + "input": 0.075, + "output": 0.3, + "cache_read": 0.02 }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 65000 } }, { - "id": "azure/gpt-5-chat", - "name": "GPT-5 Chat", - "family": "gpt-codex", + "id": "aihubmix/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", "attachment": true, "reasoning": true, - "tool_call": false, - "temperature": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" @@ -4144,29 +3986,31 @@ "open_weights": false, "cost": { "input": 1.25, - "output": 10.0, - "cache_read": 0.13 + "output": 5.0, + "cache_read": 0.31 }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 65000 } }, { - "id": "azure/gpt-5-codex", - "name": "GPT-5-Codex", - "family": "gpt-codex", - "attachment": false, + "id": "aihubmix/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" @@ -4174,30 +4018,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.13 + "input": 2.0, + "output": 12.0, + "cache_read": 0.5 }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65000 } }, { - "id": "azure/gpt-5-mini", - "name": "GPT-5 Mini", - "family": "gpt-mini", + "id": "aihubmix/gemini-3-pro-preview-search", + "name": "Gemini 3 Pro Preview Search", + "family": "gemini-pro", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" @@ -4205,57 +4051,87 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 2.0, - "cache_read": 0.03 + "input": 2.0, + "output": 12.0, + "cache_read": 0.5 }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 65000 } }, { - "id": "azure/gpt-5-nano", - "name": "GPT-5 Nano", - "family": "gpt-nano", + "id": "aihubmix/glm-4.6v", + "name": "GLM-4.6V", + "family": "glm", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.14, + "output": 0.41 }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 32768 } }, { - "id": "azure/gpt-5-pro", - "name": "GPT-5 Pro", - "family": "gpt-pro", - "attachment": true, + "id": "aihubmix/glm-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.1, + "cache_read": 0.548 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "aihubmix/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", @@ -4267,127 +4143,119 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 120.0 + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 }, "limit": { - "context": 400000, - "output": 272000 + "context": 1047576, + "output": 32768 } }, { - "id": "azure/gpt-5.1", - "name": "GPT-5.1", - "family": "gpt", + "id": "aihubmix/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "family": "gpt-mini", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "limit": { - "context": 272000, - "output": 128000 + "context": 1047576, + "output": 32768 } }, { - "id": "azure/gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "family": "gpt-codex", + "id": "aihubmix/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "family": "gpt-nano", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "limit": { - "context": 128000, - "output": 16384 + "context": 1047576, + "output": 32768 } }, { - "id": "azure/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "family": "gpt-codex", - "attachment": false, - "reasoning": true, + "id": "aihubmix/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "open_weights": false, "cost": { - "input": 1.25, + "input": 2.5, "output": 10.0, - "cache_read": 0.125 + "cache_read": 1.25 }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 } }, { - "id": "azure/gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "family": "gpt-codex", + "id": "aihubmix/gpt-5", + "name": "GPT-5", + "family": "gpt", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, + "temperature": true, "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", @@ -4399,9 +4267,9 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 5.0, + "output": 20.0, + "cache_read": 2.5 }, "limit": { "context": 400000, @@ -4409,16 +4277,16 @@ } }, { - "id": "azure/gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", + "id": "aihubmix/gpt-5-codex", + "name": "GPT-5-Codex", "family": "gpt-codex", "attachment": false, "reasoning": true, "tool_call": true, "temperature": false, "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", @@ -4430,9 +4298,9 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 2.0, - "cache_read": 0.025 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { "context": 400000, @@ -4440,16 +4308,16 @@ } }, { - "id": "azure/gpt-5.2", - "name": "GPT-5.2", - "family": "gpt", + "id": "aihubmix/gpt-5-mini", + "name": "GPT-5-Mini", + "family": "gpt-mini", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", @@ -4461,26 +4329,26 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.125 + "input": 1.5, + "output": 6.0, + "cache_read": 0.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "azure/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "family": "gpt-codex", + "id": "aihubmix/gpt-5-nano", + "name": "GPT-5-Nano", + "family": "gpt-nano", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", @@ -4492,9 +4360,9 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 0.5, + "output": 2.0, + "cache_read": 0.25 }, "limit": { "context": 128000, @@ -4502,16 +4370,16 @@ } }, { - "id": "azure/gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "family": "gpt-codex", - "attachment": false, + "id": "aihubmix/gpt-5-pro", + "name": "GPT-5-Pro", + "family": "gpt-pro", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", @@ -4523,9 +4391,9 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 7.0, + "output": 28.0, + "cache_read": 3.5 }, "limit": { "context": 400000, @@ -4533,19 +4401,20 @@ } }, { - "id": "azure/grok-3", - "name": "Grok 3", - "family": "grok", - "attachment": false, - "reasoning": false, + "id": "aihubmix/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-11", + "release_date": "2025-11-15", + "last_updated": "2025-11-15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -4553,29 +4422,30 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75 + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "azure/grok-3-mini", - "name": "Grok 3 Mini", - "family": "grok", - "attachment": false, + "id": "aihubmix/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-11", + "release_date": "2025-11-15", + "last_updated": "2025-11-15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -4583,29 +4453,29 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "azure/grok-4", - "name": "Grok 4", - "family": "grok", - "attachment": false, + "id": "aihubmix/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -4613,26 +4483,26 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75 + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 }, "limit": { - "context": 256000, - "output": 64000 + "context": 400000, + "output": 128000 } }, { - "id": "azure/grok-4-fast", - "name": "Grok 4 Fast (Reasoning)", - "family": "grok", + "id": "aihubmix/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "family": "gpt-codex", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-11", + "release_date": "2025-11-15", + "last_updated": "2025-11-15", "modalities": { "input": [ "text", @@ -4644,26 +4514,26 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 400000, + "output": 128000 } }, { - "id": "azure/grok-4-fast-non", - "name": "Grok 4 Fast (Non-Reasoning)", - "family": "grok", + "id": "aihubmix/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "modalities": { "input": [ "text", @@ -4675,29 +4545,30 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 400000, + "output": 128000 } }, { - "id": "azure/grok-code-fast-1", - "name": "Grok Code Fast 1", - "family": "grok", - "attachment": false, + "id": "aihubmix/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "family": "gpt-codex", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -4705,29 +4576,31 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 }, "limit": { - "context": 256000, - "output": 10000 + "context": 400000, + "output": 128000 } }, { - "id": "azure/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "family": "kimi-thinking", - "attachment": false, + "id": "aihubmix/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "knowledge": "2025-07", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -4736,8 +4609,8 @@ "open_weights": true, "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "output": 3.0, + "cache_read": 0.1 }, "limit": { "context": 262144, @@ -4745,20 +4618,18 @@ } }, { - "id": "azure/kimi-k2.5", - "name": "Kimi K2.5", - "family": "kimi", + "id": "aihubmix/minimax-m2.1", + "name": "MiniMax M2.1", + "family": "minimax", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -4766,59 +4637,58 @@ }, "open_weights": true, "cost": { - "input": 0.6, - "output": 3.0 + "input": 0.29, + "output": 1.15 }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 } }, { - "id": "azure/llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "family": "llama", - "attachment": true, - "reasoning": false, - "tool_call": true, - "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "id": "aihubmix/o4-mini", + "name": "o4-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2024-09", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.37, - "output": 0.37 + "input": 1.5, + "output": 6.0, + "cache_read": 0.75 }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 65536 } }, { - "id": "azure/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "family": "llama", - "attachment": true, + "id": "aihubmix/qwen3-235b-a22b-instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -4826,25 +4696,25 @@ }, "open_weights": true, "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.28, + "output": 1.12 }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 } }, { - "id": "azure/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "family": "llama", + "id": "aihubmix/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "modalities": { "input": [ "text" @@ -4855,85 +4725,81 @@ }, "open_weights": true, "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.28, + "output": 2.8 }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 } }, { - "id": "azure/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "family": "llama", - "attachment": true, + "id": "aihubmix/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.25, - "output": 1.0 + "input": 0.82, + "output": 3.29 }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 131000 } }, { - "id": "azure/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "family": "llama", - "attachment": true, + "id": "aihubmix/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.2, - "output": 0.78 + "input": 0.34, + "output": 1.37 }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 65536 } }, { - "id": "azure/mai-ds-r1", - "name": "MAI-DS-R1", - "family": "mai", + "id": "alibaba-cn/deepseek-r1", + "name": "DeepSeek R1", + "family": "deepseek-thinking", "attachment": false, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -4944,25 +4810,24 @@ }, "open_weights": false, "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.574, + "output": 2.294 }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 16384 } }, { - "id": "azure/meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "family": "llama", + "id": "alibaba-cn/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -4971,27 +4836,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.287, + "output": 0.861 }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 16384 } }, { - "id": "azure/meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "family": "llama", + "id": "alibaba-cn/deepseek-r1-distill-llama-8b", + "name": "DeepSeek R1 Distill Llama 8B", + "family": "deepseek-thinking", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -5000,27 +4864,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 16384 } }, { - "id": "azure/meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "family": "llama", + "id": "alibaba-cn/deepseek-r1-distill-qwen-1-5b", + "name": "DeepSeek R1 Distill Qwen 1.5B", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -5029,27 +4892,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 5.33, - "output": 16.0 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 16384 } }, { - "id": "azure/meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "family": "llama", + "id": "alibaba-cn/deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -5058,27 +4920,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.144, + "output": 0.431 }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 16384 } }, { - "id": "azure/meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "family": "llama", + "id": "alibaba-cn/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -5087,27 +4948,54 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.287, + "output": 0.861 }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 16384 } }, { - "id": "azure/ministral-3b", - "name": "Ministral 3B", - "family": "ministral", + "id": "alibaba-cn/deepseek-r1-distill-qwen-7b", + "name": "DeepSeek R1 Distill Qwen 7B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.072, + "output": 0.144 + }, + "limit": { + "context": 32768, + "output": 16384 + } + }, + { + "id": "alibaba-cn/deepseek-v3", + "name": "DeepSeek V3", + "family": "deepseek", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "modalities": { "input": [ "text" @@ -5116,27 +5004,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.287, + "output": 1.147 }, "limit": { - "context": 128000, + "context": 65536, "output": 8192 } }, { - "id": "azure/mistral-large", - "name": "Mistral Large 24.11", - "family": "mistral-large", + "id": "alibaba-cn/deepseek-v3-1", + "name": "DeepSeek V3.1", + "family": "deepseek", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ "text" @@ -5147,29 +5034,27 @@ }, "open_weights": false, "cost": { - "input": 2.0, - "output": 6.0 + "input": 0.574, + "output": 1.721 }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 65536 } }, { - "id": "azure/mistral-medium", - "name": "Mistral Medium 3", - "family": "mistral-medium", - "attachment": true, + "id": "alibaba-cn/deepseek-v3-2-exp", + "name": "DeepSeek V3.2 Exp", + "family": "deepseek", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5177,25 +5062,24 @@ }, "open_weights": false, "cost": { - "input": 0.4, - "output": 2.0 + "input": 0.287, + "output": 0.431 }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 65536 } }, { - "id": "azure/mistral-nemo", - "name": "Mistral Nemo", - "family": "mistral-nemo", + "id": "alibaba-cn/kimi-k2-thinking", + "name": "Moonshot Kimi K2 Thinking", + "family": "kimi", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "modalities": { "input": [ "text" @@ -5206,25 +5090,24 @@ }, "open_weights": true, "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.574, + "output": 2.294 }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 16384 } }, { - "id": "azure/mistral-small", - "name": "Mistral Small 3.1", - "family": "mistral-small", - "attachment": true, - "reasoning": false, + "id": "alibaba-cn/kimi-k2.5", + "name": "Moonshot Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "modalities": { "input": [ "text", @@ -5234,55 +5117,55 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.574, + "output": 2.411 }, "limit": { - "context": 128000, + "context": 262144, "output": 32768 } }, { - "id": "azure/model-router", - "name": "Model Router", - "family": "model-router", - "attachment": true, + "id": "alibaba-cn/moonshot-kimi-k2-instruct", + "name": "Moonshot Kimi K2 Instruct", + "family": "kimi", + "attachment": false, "reasoning": false, "tool_call": true, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "temperature": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.14, - "output": 0.0 + "input": 0.574, + "output": 2.294 }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 } }, { - "id": "azure/o1", - "name": "o1", - "family": "o", + "id": "alibaba-cn/qvq-max", + "name": "QVQ Max", + "family": "qvq", "attachment": false, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "modalities": { "input": [ "text", @@ -5294,26 +5177,25 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 60.0, - "cache_read": 7.5 + "input": 1.147, + "output": 4.588 }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 } }, { - "id": "azure/o1-mini", - "name": "o1-mini", - "family": "o-mini", + "id": "alibaba-cn/qwen-deep-research", + "name": "Qwen Deep Research", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "modalities": { "input": [ "text" @@ -5324,26 +5206,25 @@ }, "open_weights": false, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 7.742, + "output": 23.367 }, "limit": { - "context": 128000, - "output": 65536 + "context": 1000000, + "output": 32768 } }, { - "id": "azure/o1-preview", - "name": "o1-preview", - "family": "o", + "id": "alibaba-cn/qwen-doc-turbo", + "name": "Qwen Doc Turbo", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "modalities": { "input": [ "text" @@ -5354,30 +5235,28 @@ }, "open_weights": false, "cost": { - "input": 16.5, - "output": 66.0, - "cache_read": 8.25 + "input": 0.087, + "output": 0.144 }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 } }, { - "id": "azure/o3", - "name": "o3", - "family": "o", - "attachment": true, + "id": "alibaba-cn/qwen-flash", + "name": "Qwen Flash", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5385,26 +5264,25 @@ }, "open_weights": false, "cost": { - "input": 2.0, - "output": 8.0, - "cache_read": 0.5 + "input": 0.022, + "output": 0.216 }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 32768 } }, { - "id": "azure/o3-mini", - "name": "o3-mini", - "family": "o-mini", + "id": "alibaba-cn/qwen-long", + "name": "Qwen Long", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "modalities": { "input": [ "text" @@ -5415,30 +5293,28 @@ }, "open_weights": false, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.072, + "output": 0.287 }, "limit": { - "context": 200000, - "output": 100000 + "context": 10000000, + "output": 8192 } }, { - "id": "azure/o4-mini", - "name": "o4-mini", - "family": "o-mini", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen-math-plus", + "name": "Qwen Math Plus", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-08-16", + "last_updated": "2024-09-19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5446,26 +5322,25 @@ }, "open_weights": false, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.574, + "output": 1.721 }, "limit": { - "context": 200000, - "output": 100000 + "context": 4096, + "output": 3072 } }, { - "id": "azure/phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "family": "phi", + "id": "alibaba-cn/qwen-math-turbo", + "name": "Qwen Math Turbo", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "modalities": { "input": [ "text" @@ -5474,27 +5349,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.287, + "output": 0.861 }, "limit": { - "context": 128000, - "output": 4096 + "context": 4096, + "output": 3072 } }, { - "id": "azure/phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "family": "phi", + "id": "alibaba-cn/qwen-max", + "name": "Qwen Max", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "modalities": { "input": [ "text" @@ -5503,27 +5378,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.345, + "output": 1.377 }, "limit": { - "context": 4096, - "output": 1024 + "context": 131072, + "output": 8192 } }, { - "id": "azure/phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "family": "phi", + "id": "alibaba-cn/qwen-mt-plus", + "name": "Qwen-MT Plus", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": false, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "modalities": { "input": [ "text" @@ -5532,27 +5407,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.259, + "output": 0.775 }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 8192 } }, { - "id": "azure/phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "family": "phi", + "id": "alibaba-cn/qwen-mt-turbo", + "name": "Qwen-MT Turbo", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": false, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "modalities": { "input": [ "text" @@ -5561,85 +5436,92 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.101, + "output": 0.28 }, "limit": { - "context": 4096, - "output": 1024 + "context": 16384, + "output": 8192 } }, { - "id": "azure/phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "family": "phi", + "id": "alibaba-cn/qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.058, + "output": 0.23 }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 2048 } }, { - "id": "azure/phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "family": "phi", + "id": "alibaba-cn/qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.23, + "output": 0.918 }, "limit": { - "context": 8192, + "context": 32768, "output": 2048 } }, { - "id": "azure/phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "family": "phi", + "id": "alibaba-cn/qwen-plus", + "name": "Qwen Plus", + "family": "qwen", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "modalities": { "input": [ "text" @@ -5648,27 +5530,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.115, + "output": 0.287 }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 } }, { - "id": "azure/phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "family": "phi", + "id": "alibaba-cn/qwen-plus-character", + "name": "Qwen Plus Character", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "modalities": { "input": [ "text" @@ -5677,27 +5559,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.16, - "output": 0.64 + "input": 0.115, + "output": 0.287 }, "limit": { - "context": 128000, + "context": 32768, "output": 4096 } }, { - "id": "azure/phi-4", - "name": "Phi-4-reasoning", - "family": "phi", + "id": "alibaba-cn/qwen-turbo", + "name": "Qwen Turbo", + "family": "qwen", "attachment": false, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-07-15", "modalities": { "input": [ "text" @@ -5706,114 +5588,117 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.044, + "output": 0.087 }, "limit": { - "context": 32000, - "output": 4096 + "context": 1000000, + "output": 16384 } }, { - "id": "azure/phi-4-mini", - "name": "Phi-4-mini-reasoning", - "family": "phi", + "id": "alibaba-cn/qwen-vl-max", + "name": "Qwen-VL Max", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.23, + "output": 0.574 }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 } }, { - "id": "azure/phi-4-multimodal", - "name": "Phi-4-multimodal", - "family": "phi", - "attachment": true, + "id": "alibaba-cn/qwen-vl-ocr", + "name": "Qwen-VL OCR", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": false, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.08, - "output": 0.32 + "input": 0.717, + "output": 0.717 }, "limit": { - "context": 128000, + "context": 34096, "output": 4096 } }, { - "id": "azure/phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "family": "phi", + "id": "alibaba-cn/qwen-vl-plus", + "name": "Qwen-VL Plus", + "family": "qwen", "attachment": false, - "reasoning": true, - "tool_call": false, + "reasoning": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.115, + "output": 0.287 }, "limit": { - "context": 32000, - "output": 4096 + "context": 131072, + "output": 8192 } }, { - "id": "azure/text-embedding-3-large", - "name": "text-embedding-3-large", - "family": "text-embedding", + "id": "alibaba-cn/qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" @@ -5822,25 +5707,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.13, - "output": 0.0 + "input": 0.144, + "output": 0.431 }, "limit": { - "context": 8191, - "output": 3072 + "context": 131072, + "output": 8192 } }, { - "id": "azure/text-embedding-3-small", - "name": "text-embedding-3-small", - "family": "text-embedding", + "id": "alibaba-cn/qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" @@ -5849,25 +5736,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.02, - "output": 0.0 + "input": 0.287, + "output": 0.861 }, "limit": { - "context": 8191, - "output": 1536 + "context": 131072, + "output": 8192 } }, { - "id": "azure/text-embedding-ada-002", - "name": "text-embedding-ada-002", - "family": "text-embedding", + "id": "alibaba-cn/qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" @@ -5876,27 +5765,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.0 + "input": 0.574, + "output": 1.721 }, "limit": { - "context": 8192, - "output": 1536 + "context": 131072, + "output": 8192 } }, { - "id": "cohere/command-a-03", - "name": "Command A", - "family": "command-a", + "id": "alibaba-cn/qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" @@ -5907,25 +5796,25 @@ }, "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0 + "input": 0.072, + "output": 0.144 }, "limit": { - "context": 256000, - "output": 8000 + "context": 131072, + "output": 8192 } }, { - "id": "cohere/command-a-reasoning-08", - "name": "Command A Reasoning", - "family": "command-a", + "id": "alibaba-cn/qwen2-5-coder-32b-instruct", + "name": "Qwen2.5-Coder 32B Instruct", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "modalities": { "input": [ "text" @@ -5936,25 +5825,25 @@ }, "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0 + "input": 0.287, + "output": 0.861 }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 8192 } }, { - "id": "cohere/command-a-translate-08", - "name": "Command A Translate", - "family": "command-a", + "id": "alibaba-cn/qwen2-5-coder-7b-instruct", + "name": "Qwen2.5-Coder 7B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "modalities": { "input": [ "text" @@ -5965,29 +5854,28 @@ }, "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0 + "input": 0.144, + "output": 0.287 }, "limit": { - "context": 8000, - "output": 8000 + "context": 131072, + "output": 8192 } }, { - "id": "cohere/command-a-vision-07", - "name": "Command A Vision", - "family": "command-a", + "id": "alibaba-cn/qwen2-5-math-72b-instruct", + "name": "Qwen2.5-Math 72B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5995,25 +5883,25 @@ }, "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0 + "input": 0.574, + "output": 1.721 }, "limit": { - "context": 128000, - "output": 8000 + "context": 4096, + "output": 3072 } }, { - "id": "cohere/command-r-08", - "name": "Command R", - "family": "command-r", + "id": "alibaba-cn/qwen2-5-math-7b-instruct", + "name": "Qwen2.5-Math 7B Instruct", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" @@ -6024,57 +5912,62 @@ }, "open_weights": true, "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.144, + "output": 0.287 }, "limit": { - "context": 128000, - "output": 4000 + "context": 4096, + "output": 3072 } }, { - "id": "cohere/command-r-plus-08", - "name": "Command R+", - "family": "command-r", + "id": "alibaba-cn/qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "open_weights": true, "cost": { - "input": 2.5, - "output": 10.0 + "input": 0.087, + "output": 0.345 }, "limit": { - "context": 128000, - "output": 4000 + "context": 32768, + "output": 2048 } }, { - "id": "cohere/command-r7b-12", - "name": "Command R7B", - "family": "command-r", + "id": "alibaba-cn/qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06-01", - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -6082,55 +5975,55 @@ }, "open_weights": true, "cost": { - "input": 0.0375, - "output": 0.15 + "input": 2.294, + "output": 6.881 }, "limit": { - "context": 128000, - "output": 4000 + "context": 131072, + "output": 8192 } }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek Chat", - "family": "deepseek", - "attachment": true, + "id": "alibaba-cn/qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.028 + "input": 0.287, + "output": 0.717 }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 } }, { - "id": "deepseek/deepseek-reasoner", - "name": "DeepSeek Reasoner", - "family": "deepseek-thinking", - "attachment": true, + "id": "alibaba-cn/qwen3-14b", + "name": "Qwen3 14B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-09-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ "text" @@ -6139,137 +6032,117 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.028 + "input": 0.144, + "output": 0.574 }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 } }, { - "id": "google-vertex/gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "family": "gemini-flash", - "attachment": true, - "reasoning": false, + "id": "alibaba-cn/qwen3-235b-a22b", + "name": "Qwen3 235B-A22B", + "family": "qwen", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.025 + "input": 0.287, + "output": 1.147 }, "limit": { - "context": 1048576, - "output": 8192 + "context": 131072, + "output": 16384 } }, { - "id": "google-vertex/gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "family": "gemini-flash-lite", - "attachment": true, - "reasoning": false, + "id": "alibaba-cn/qwen3-32b", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.287, + "output": 1.147 }, "limit": { - "context": 1048576, - "output": 8192 + "context": 131072, + "output": 16384 } }, { - "id": "google-vertex/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "family": "gemini-flash", - "attachment": true, + "id": "alibaba-cn/qwen3-8b", + "name": "Qwen3 8B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.072, + "output": 0.287 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google-vertex/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "family": "gemini-flash-lite", - "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "id": "alibaba-cn/qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "audio" ], "output": [ "text" @@ -6277,101 +6150,86 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.032, + "output": 0.032 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 53248, + "output": 4096 } }, { - "id": "google-vertex/gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "family": "gemini-flash-lite", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.216, + "output": 0.861 }, "limit": { - "context": 65536, + "context": 262144, "output": 65536 } }, { - "id": "google-vertex/gemini-2.5-flash-lite-preview-09", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "family": "gemini-flash-lite", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.861, + "output": 3.441 }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 } }, { - "id": "google-vertex/gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -6379,43 +6237,37 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.144, + "output": 0.574 }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 } }, { - "id": "google-vertex/gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 1.0, + "output": 5.0 }, "limit": { "context": 1048576, @@ -6423,23 +6275,19 @@ } }, { - "id": "google-vertex/gemini-2.5-flash-preview-09", - "name": "Gemini 2.5 Flash Preview 09-25", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -6447,233 +6295,212 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.861, + "output": 3.441 }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 } }, { - "id": "google-vertex/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next 80B-A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.144, + "output": 0.574 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 } }, { - "id": "google-vertex/gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "family": "gemini-pro", - "attachment": true, + "id": "alibaba-cn/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next 80B-A3B (Thinking)", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.144, + "output": 1.434 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 } }, { - "id": "google-vertex/gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "family": "gemini-pro", - "attachment": true, + "id": "alibaba-cn/qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio" ] }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.058, + "output": 0.23 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 } }, { - "id": "google-vertex/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba-cn/qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "open_weights": false, "cost": { - "input": 0.5, - "output": 3.0, - "cache_read": 0.05 + "input": 0.23, + "output": 0.918 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 } }, { - "id": "google-vertex/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "family": "gemini-pro", - "attachment": true, + "id": "alibaba-cn/qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 12.0, - "cache_read": 0.2 + "input": 0.286705, + "output": 1.14682 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 } }, { - "id": "google-vertex/gemini-embedding-001", - "name": "Gemini Embedding 001", - "family": "gemini", + "id": "alibaba-cn/qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "family": "qwen", "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.15, - "output": 0.0 + "input": 0.108, + "output": 0.431 }, "limit": { - "context": 2048, - "output": 3072 + "context": 131072, + "output": 32768 } }, { - "id": "google-vertex/gemini-flash", - "name": "Gemini Flash Latest", - "family": "gemini-flash", - "attachment": true, + "id": "alibaba-cn/qwen3-vl-plus", + "name": "Qwen3-VL Plus", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -6681,88 +6508,87 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.143353, + "output": 1.433525 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 } }, { - "id": "google-vertex/gemini-flash-lite", - "name": "Gemini Flash-Lite Latest", - "family": "gemini-flash-lite", - "attachment": true, + "id": "alibaba-cn/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.43, + "output": 2.58 }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 } }, { - "id": "google-vertex/openai/gpt-oss-120b-maas", - "name": "GPT OSS 120B", - "family": "gpt-oss", + "id": "alibaba-cn/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.09, - "output": 0.36 + "input": 0.573, + "output": 3.44 }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 65536 } }, { - "id": "google-vertex/openai/gpt-oss-20b-maas", - "name": "GPT OSS 20B", - "family": "gpt-oss", + "id": "alibaba-cn/qwq-32b", + "name": "QwQ 32B", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "modalities": { "input": [ "text" @@ -6773,25 +6599,25 @@ }, "open_weights": true, "cost": { - "input": 0.07, - "output": 0.25 + "input": 0.287, + "output": 0.861 }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 } }, { - "id": "google-vertex/zai-org/glm-4.7-maas", - "name": "GLM-4.7", - "family": "glm", + "id": "alibaba-cn/qwq-plus", + "name": "QwQ Plus", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "modalities": { "input": [ "text" @@ -6800,33 +6626,30 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.23, + "output": 0.574 }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-1.5-flash", - "name": "Gemini 1.5 Flash", - "family": "gemini-flash", - "attachment": true, + "id": "alibaba-cn/tongyi-intent-detect-v3", + "name": "Tongyi Intent Detect V3", + "family": "yi", + "attachment": false, "reasoning": false, - "tool_call": true, + "tool_call": false, "temperature": true, "knowledge": "2024-04", - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "release_date": "2024-01", + "last_updated": "2024-01", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" @@ -6834,32 +6657,29 @@ }, "open_weights": false, "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.01875 + "input": 0.058, + "output": 0.144 }, "limit": { - "context": 1000000, - "output": 8192 + "context": 8192, + "output": 1024 } }, { - "id": "google/gemini-1.5-flash-8b", - "name": "Gemini 1.5 Flash-8B", - "family": "gemini-flash", - "attachment": true, - "reasoning": false, + "id": "alibaba/qvq-max", + "name": "QVQ Max", + "family": "qvq", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2024-04", - "release_date": "2024-10-03", - "last_updated": "2024-10-03", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" @@ -6867,32 +6687,28 @@ }, "open_weights": false, "cost": { - "input": 0.0375, - "output": 0.15, - "cache_read": 0.01 + "input": 1.2, + "output": 4.8 }, "limit": { - "context": 1000000, + "context": 131072, "output": 8192 } }, { - "id": "google/gemini-1.5-pro", - "name": "Gemini 1.5 Pro", - "family": "gemini-pro", - "attachment": true, - "reasoning": false, + "id": "alibaba/qwen-flash", + "name": "Qwen Flash", + "family": "qwen", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2024-04", - "release_date": "2024-02-15", - "last_updated": "2024-02-15", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" @@ -6900,33 +6716,28 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 5.0, - "cache_read": 0.3125 + "input": 0.05, + "output": 0.4 }, "limit": { "context": 1000000, - "output": 8192 + "output": 32768 } }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "family": "gemini-flash", - "attachment": true, + "id": "alibaba/qwen-max", + "name": "Qwen Max", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -6934,33 +6745,28 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 1.6, + "output": 6.4 }, "limit": { - "context": 1048576, + "context": 32768, "output": 8192 } }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "family": "gemini-flash-lite", - "attachment": true, + "id": "alibaba/qwen-mt-plus", + "name": "Qwen-MT Plus", + "family": "qwen", + "attachment": false, "reasoning": false, - "tool_call": true, + "tool_call": false, "temperature": true, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -6968,32 +6774,28 @@ }, "open_weights": false, "cost": { - "input": 0.075, - "output": 0.3 + "input": 2.46, + "output": 7.37 }, "limit": { - "context": 1048576, + "context": 16384, "output": 8192 } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, - "tool_call": true, + "id": "alibaba/qwen-mt-turbo", + "name": "Qwen-MT Turbo", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -7001,97 +6803,93 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 0.16, + "output": 0.49 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 8192 } }, { - "id": "google/gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, - "tool_call": false, + "id": "alibaba/qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text", - "image" + "audio" ] }, "open_weights": false, "cost": { - "input": 0.3, - "output": 30.0, - "cache_read": 0.075 + "input": 0.07, + "output": 0.27 }, "limit": { "context": 32768, - "output": 32768 + "output": 2048 } }, { - "id": "google/gemini-2.5-flash-image-preview", - "name": "Gemini 2.5 Flash Image (Preview)", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, - "tool_call": false, + "id": "alibaba/qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text", - "image" + "audio" ] }, "open_weights": false, "cost": { - "input": 0.3, - "output": 30.0, - "cache_read": 0.075 + "input": 0.27, + "output": 1.07 }, "limit": { "context": 32768, - "output": 32768 + "output": 2048 } }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "family": "gemini-flash-lite", - "attachment": true, + "id": "alibaba/qwen-plus", + "name": "Qwen Plus", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -7099,33 +6897,28 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.4, + "output": 1.2 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 } }, { - "id": "google/gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "family": "gemini-flash-lite", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen-plus-character-ja", + "name": "Qwen Plus Character (Japanese)", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -7133,33 +6926,28 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.5, + "output": 1.4 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 512 } }, { - "id": "google/gemini-2.5-flash-lite-preview-09", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "family": "gemini-flash-lite", - "attachment": true, + "id": "alibaba/qwen-turbo", + "name": "Qwen Turbo", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -7167,33 +6955,29 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.05, + "output": 0.2 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 16384 } }, { - "id": "google/gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen-vl-max", + "name": "Qwen-VL Max", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -7201,33 +6985,29 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.8, + "output": 3.2 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, - "tool_call": true, + "id": "alibaba/qwen-vl-ocr", + "name": "Qwen-VL OCR", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -7235,33 +7015,29 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.72, + "output": 0.72 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 34096, + "output": 4096 } }, { - "id": "google/gemini-2.5-flash-preview-09", - "name": "Gemini 2.5 Flash Preview 09-25", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen-vl-plus", + "name": "Qwen-VL Plus", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -7269,254 +7045,234 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 0.21, + "output": 0.63 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-2.5-flash-preview-tts", - "name": "Gemini 2.5 Flash Preview TTS", - "family": "gemini-flash", + "id": "alibaba/qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.5, - "output": 10.0 + "input": 0.35, + "output": 1.4 }, "limit": { - "context": 8000, - "output": 16000 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.7, + "output": 2.8 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 1.4, + "output": 5.6 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.175, + "output": 0.7 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-2.5-pro-preview-tts", - "name": "Gemini 2.5 Pro Preview TTS", - "family": "gemini-flash", + "id": "alibaba/qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "family": "qwen", "attachment": false, "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ + "text", "audio" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.0, - "output": 20.0 + "input": 0.1, + "output": 0.4 }, "limit": { - "context": 8000, - "output": 16000 + "context": 32768, + "output": 2048 } }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "family": "gemini-flash", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.5, - "output": 3.0, - "cache_read": 0.05 + "input": 2.8, + "output": 8.4 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, + "id": "alibaba/qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 12.0, - "cache_read": 0.2 + "input": 0.35, + "output": 1.05 }, "limit": { - "context": 1000000, - "output": 64000 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-embedding-001", - "name": "Gemini Embedding 001", - "family": "gemini", + "id": "alibaba/qwen3-14b", + "name": "Qwen3 14B", + "family": "qwen", "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ "text" @@ -7525,160 +7281,143 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.15, - "output": 0.0 + "input": 0.35, + "output": 1.4 }, "limit": { - "context": 2048, - "output": 3072 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-flash", - "name": "Gemini Flash Latest", - "family": "gemini-flash", - "attachment": true, + "id": "alibaba/qwen3-235b-a22b", + "name": "Qwen3 235B-A22B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 0.7, + "output": 2.8 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 } }, { - "id": "google/gemini-flash-lite", - "name": "Gemini Flash-Lite Latest", - "family": "gemini-flash-lite", - "attachment": true, + "id": "alibaba/qwen3-32b", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.7, + "output": 2.8 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 } }, { - "id": "google/gemini-live-2.5-flash", - "name": "Gemini Live 2.5 Flash", - "family": "gemini-flash", - "attachment": true, + "id": "alibaba/qwen3-8b", + "name": "Qwen3 8B", + "family": "qwen", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.5, - "output": 2.0 + "input": 0.18, + "output": 0.7 }, "limit": { - "context": 128000, - "output": 8000 + "context": 131072, + "output": 8192 } }, { - "id": "google/gemini-live-2.5-flash-preview-native-audio", - "name": "Gemini Live 2.5 Flash Preview Native Audio", - "family": "gemini-flash", + "id": "alibaba/qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "family": "qwen", "attachment": false, - "reasoning": true, - "tool_call": true, + "reasoning": false, + "tool_call": false, "temperature": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-09-18", + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "modalities": { "input": [ - "text", - "audio", - "video" + "audio" ], "output": [ - "text", - "audio" + "text" ] }, "open_weights": false, "cost": { - "input": 0.5, - "output": 2.0 + "input": 0.035, + "output": 0.035 }, "limit": { - "context": 131072, - "output": 65536 + "context": 53248, + "output": 4096 } }, { - "id": "meta-llama/cerebras-llama-4-maverick-17b-128e-instruct", - "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ "text" @@ -7689,25 +7428,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.45, + "output": 2.25 }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 } }, { - "id": "meta-llama/cerebras-llama-4-scout-17b-16e-instruct", - "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ "text" @@ -7718,25 +7457,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.5, + "output": 7.5 }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 } }, { - "id": "meta-llama/groq-llama-4-maverick-17b-128e-instruct", - "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -7745,27 +7484,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.3, + "output": 1.5 }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 65536 } }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "modalities": { "input": [ "text" @@ -7776,88 +7515,90 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.0, + "output": 5.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 } }, { - "id": "meta-llama/llama-3.3-8b-instruct", - "name": "Llama-3.3-8B-Instruct", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-livetranslate-flash-realtime", + "name": "Qwen3-LiveTranslate Flash Realtime", + "family": "qwen", + "attachment": false, "reasoning": false, - "tool_call": true, + "tool_call": false, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-04", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 10.0, + "output": 10.0 }, "limit": { - "context": 128000, + "context": 53248, "output": 4096 } }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.2, + "output": 6.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 } }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct-fp8", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "family": "llama", - "attachment": true, + "id": "alibaba/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next 80B-A3B Instruct", + "family": "qwen", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7865,25 +7606,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.5, + "output": 2.0 }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 } }, { - "id": "mistralai/codestral", - "name": "Codestral", - "family": "codestral", + "id": "alibaba/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next 80B-A3B (Thinking)", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "modalities": { "input": [ "text" @@ -7894,86 +7635,95 @@ }, "open_weights": true, "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.5, + "output": 6.0 }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 32768 } }, { - "id": "mistralai/devstral", - "name": "Devstral 2", - "family": "devstral", + "id": "alibaba/qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.4, - "output": 2.0 + "input": 0.43, + "output": 1.66 }, "limit": { - "context": 262144, - "output": 262144 + "context": 65536, + "output": 16384 } }, { - "id": "mistralai/devstral-medium", - "name": "Devstral 2", - "family": "devstral", + "id": "alibaba/qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "family": "qwen", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.4, - "output": 2.0 + "input": 0.52, + "output": 1.99 }, "limit": { - "context": 262144, - "output": 262144 + "context": 65536, + "output": 16384 } }, { - "id": "mistralai/devstral-small", - "name": "Devstral Small", - "family": "devstral", + "id": "alibaba/qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -7981,25 +7731,25 @@ }, "open_weights": true, "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.7, + "output": 2.8 }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 } }, { - "id": "mistralai/labs-devstral-small", - "name": "Devstral Small 2", - "family": "devstral", + "id": "alibaba/qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "modalities": { "input": [ "text", @@ -8011,57 +7761,60 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.2, + "output": 0.8 }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 32768 } }, { - "id": "mistralai/magistral-medium", - "name": "Magistral Medium", - "family": "magistral-medium", + "id": "alibaba/qwen3-vl-plus", + "name": "Qwen3-VL Plus", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.0, - "output": 5.0 + "input": 0.2, + "output": 1.6 }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 } }, { - "id": "mistralai/magistral-small", - "name": "Magistral Small", - "family": "magistral-small", + "id": "alibaba/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -8069,54 +7822,56 @@ }, "open_weights": true, "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.6, + "output": 3.6 }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65536 } }, { - "id": "mistralai/ministral-3b", - "name": "Ministral 3B", - "family": "ministral", + "id": "alibaba/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.4, + "output": 2.4 }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 65536 } }, { - "id": "mistralai/ministral-8b", - "name": "Ministral 8B", - "family": "ministral", + "id": "alibaba/qwq-plus", + "name": "QwQ Plus", + "family": "qwen", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "modalities": { "input": [ "text" @@ -8125,26 +7880,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.8, + "output": 2.4 }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 } }, { - "id": "mistralai/mistral-embed", - "name": "Mistral Embed", - "family": "mistral-embed", + "id": "amazon-bedrock/ai21.jamba-1.5-large-v1:0", + "name": "Jamba 1.5 Large", + "family": "jamba", "attachment": false, "reasoning": false, - "tool_call": false, - "temperature": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "modalities": { "input": [ "text" @@ -8153,27 +7909,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.1, - "output": 0.0 + "input": 2.0, + "output": 8.0 }, "limit": { - "context": 8000, - "output": 3072 + "context": 256000, + "output": 4096 } }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large 2.1", - "family": "mistral-large", + "id": "amazon-bedrock/ai21.jamba-1.5-mini-v1:0", + "name": "Jamba 1.5 Mini", + "family": "jamba", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "knowledge": "2024-08", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "modalities": { "input": [ "text" @@ -8184,172 +7940,179 @@ }, "open_weights": true, "cost": { - "input": 2.0, - "output": 6.0 + "input": 0.2, + "output": 0.4 }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 4096 } }, { - "id": "mistralai/mistral-medium", - "name": "Mistral Medium", - "family": "mistral-medium", + "id": "amazon-bedrock/amazon.nova-2-lite-v1:0", + "name": "Nova 2 Lite", + "family": "nova", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.4, - "output": 2.0 + "input": 0.33, + "output": 2.75 }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 } }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral Nemo", - "family": "mistral-nemo", - "attachment": false, + "id": "amazon-bedrock/amazon.nova-lite-v1:0", + "name": "Nova Lite", + "family": "nova-lite", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "limit": { - "context": 128000, - "output": 128000 + "context": 300000, + "output": 8192 } }, { - "id": "mistralai/mistral-small", - "name": "Mistral Small", - "family": "mistral-small", + "id": "amazon-bedrock/amazon.nova-micro-v1:0", + "name": "Nova Micro", + "family": "nova-micro", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03", - "release_date": "2024-09-01", - "last_updated": "2024-09-04", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 } }, { - "id": "mistralai/open-mistral-7b", - "name": "Mistral 7B", - "family": "mistral", - "attachment": false, - "reasoning": false, + "id": "amazon-bedrock/amazon.nova-premier-v1:0", + "name": "Nova Premier", + "family": "nova", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.25, - "output": 0.25 + "input": 2.5, + "output": 12.5 }, "limit": { - "context": 8000, - "output": 8000 + "context": 1000000, + "output": 16384 } }, { - "id": "mistralai/open-mixtral-8x22b", - "name": "Mixtral 8x22B", - "family": "mixtral", - "attachment": false, + "id": "amazon-bedrock/amazon.nova-pro-v1:0", + "name": "Nova Pro", + "family": "nova-pro", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.0, - "output": 6.0 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, "limit": { - "context": 64000, - "output": 64000 + "context": 300000, + "output": 8192 } }, { - "id": "mistralai/open-mixtral-8x7b", - "name": "Mixtral 8x7B", - "family": "mixtral", + "id": "amazon-bedrock/amazon.titan-text-express-v1", + "name": "Titan Text G1 - Express", + "family": "titan", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-01", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "modalities": { "input": [ "text" @@ -8358,90 +8121,91 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.2, + "output": 0.6 }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 4096 } }, { - "id": "mistralai/pixtral-12b", - "name": "Pixtral 12B", - "family": "pixtral", - "attachment": true, + "id": "amazon-bedrock/amazon.titan-text-express-v1:0:8k", + "name": "Titan Text G1 - Express", + "family": "titan", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.2, + "output": 0.6 }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 } }, { - "id": "mistralai/pixtral-large", - "name": "Pixtral Large", - "family": "pixtral", + "id": "amazon-bedrock/anthropic.claude-3-haiku-20240307-v1:0", + "name": "Claude Haiku 3", + "family": "claude-haiku", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "knowledge": "2024-02", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 2.0, - "output": 6.0 + "input": 0.25, + "output": 1.25 }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 4096 } }, { - "id": "openai/codex-mini", - "name": "Codex Mini", - "family": "gpt-codex-mini", + "id": "amazon-bedrock/anthropic.claude-3-opus-20240229-v1:0", + "name": "Claude Opus 3", + "family": "claude-opus", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "temperature": true, + "knowledge": "2023-08", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -8449,29 +8213,30 @@ }, "open_weights": false, "cost": { - "input": 1.5, - "output": 6.0, - "cache_read": 0.375 + "input": 15.0, + "output": 75.0 }, "limit": { "context": 200000, - "output": 100000 + "output": 4096 } }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "family": "gpt", - "attachment": false, + "id": "amazon-bedrock/anthropic.claude-3-sonnet-20240229-v1:0", + "name": "Claude Sonnet 3", + "family": "claude-sonnet", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "knowledge": "2023-08", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -8479,29 +8244,30 @@ }, "open_weights": false, "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 16385, + "context": 200000, "output": 4096 } }, { - "id": "openai/gpt-4", - "name": "GPT-4", - "family": "gpt", + "id": "amazon-bedrock/anthropic.claude-3.5-haiku-20241022-v1:0", + "name": "Claude Haiku 3.5", + "family": "claude-haiku", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-07", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -8509,29 +8275,32 @@ }, "open_weights": false, "cost": { - "input": 30.0, - "output": 60.0 + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 }, "limit": { - "context": 8192, + "context": 200000, "output": 8192 } }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "family": "gpt", + "id": "amazon-bedrock/anthropic.claude-3.5-sonnet-20240620-v1:0", + "name": "Claude Sonnet 3.5", + "family": "claude-sonnet", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8539,29 +8308,32 @@ }, "open_weights": false, "cost": { - "input": 10.0, - "output": 30.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 8192 } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "family": "gpt", + "id": "amazon-bedrock/anthropic.claude-3.5-sonnet-20241022-v2:0", + "name": "Claude Sonnet 3.5 v2", + "family": "claude-sonnet", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8569,30 +8341,32 @@ }, "open_weights": false, "cost": { - "input": 2.0, - "output": 8.0, - "cache_read": 0.5 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "family": "gpt-mini", + "id": "amazon-bedrock/anthropic.claude-3.7-sonnet-20250219-v1:0", + "name": "Claude Sonnet 3.7", + "family": "claude-sonnet", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8600,30 +8374,32 @@ }, "open_weights": false, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 } }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "family": "gpt-nano", + "id": "amazon-bedrock/anthropic.claude-haiku-4.5-20251001-v1:0", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8631,30 +8407,30 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "family": "gpt", - "attachment": true, + "id": "amazon-bedrock/anthropic.claude-instant-v1", + "name": "Claude Instant", + "family": "claude", + "attachment": false, "reasoning": false, - "tool_call": true, + "tool_call": false, "temperature": true, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2023-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -8662,30 +8438,30 @@ }, "open_weights": false, "cost": { - "input": 2.5, - "output": 10.0, - "cache_read": 1.25 + "input": 0.8, + "output": 2.4 }, "limit": { - "context": 128000, - "output": 16384 + "context": 100000, + "output": 4096 } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "family": "gpt-mini", + "id": "amazon-bedrock/anthropic.claude-opus-4-20250514-v1:0", + "name": "Claude Opus 4", + "family": "claude-opus", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8693,30 +8469,32 @@ }, "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "family": "gpt", + "id": "amazon-bedrock/anthropic.claude-opus-4.1-20250805-v1:0", + "name": "Claude Opus 4.1", + "family": "claude-opus", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8724,30 +8502,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 } }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat (latest)", - "family": "gpt-codex", + "id": "amazon-bedrock/anthropic.claude-opus-4.5-20251101-v1:0", + "name": "Claude Opus 4.5", + "family": "claude-opus", "attachment": true, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8755,29 +8535,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "family": "gpt-codex", - "attachment": false, + "id": "amazon-bedrock/anthropic.claude-opus-4.6-v1", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8785,30 +8568,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "family": "gpt-mini", + "id": "amazon-bedrock/anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8816,30 +8601,32 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 2.0, - "cache_read": 0.025 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "family": "gpt-nano", + "id": "amazon-bedrock/anthropic.claude-sonnet-4.5-20250929-v1:0", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8847,30 +8634,32 @@ }, "open_weights": false, "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 Pro", - "family": "gpt-pro", + "id": "amazon-bedrock/anthropic.claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8878,29 +8667,293 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 120.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 400000, - "output": 272000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "family": "gpt", - "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "id": "amazon-bedrock/anthropic.claude-v2", + "name": "Claude 2", + "family": "claude", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-08", + "release_date": "2023-07-11", + "last_updated": "2023-07-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 8.0, + "output": 24.0 + }, + "limit": { + "context": 100000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/anthropic.claude-v2:1", + "name": "Claude 2.1", + "family": "claude", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-08", + "release_date": "2023-11-21", + "last_updated": "2023-11-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 8.0, + "output": 24.0 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/cohere.command-light-text-v14", + "name": "Command Light", + "family": "command-light", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-08", + "release_date": "2023-11-01", + "last_updated": "2023-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.6 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/cohere.command-r-plus-v1:0", + "name": "Command R+", + "family": "command-r", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-04-04", + "last_updated": "2024-04-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 3.0, + "output": 15.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/cohere.command-r-v1:0", + "name": "Command R", + "family": "command-r", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-03-11", + "last_updated": "2024-03-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 1.5 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/cohere.command-text-v14", + "name": "Command", + "family": "command", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-08", + "release_date": "2023-11-01", + "last_updated": "2023-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.5, + "output": 2.0 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/deepseek.r1-v1:0", + "name": "DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.35, + "output": 5.4 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "amazon-bedrock/deepseek.v3-v1:0", + "name": "DeepSeek-V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.58, + "output": 1.68 + }, + "limit": { + "context": 163840, + "output": 81920 + } + }, + { + "id": "amazon-bedrock/deepseek.v3.2-v1:0", + "name": "DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.62, + "output": 1.85 + }, + "limit": { + "context": 163840, + "output": 81920 + } + }, + { + "id": "amazon-bedrock/eu.anthropic.claude-haiku-4.5-20251001-v1:0", + "name": "Claude Haiku 4.5 (EU)", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8908,30 +8961,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.13 + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "family": "gpt-codex", + "id": "amazon-bedrock/eu.anthropic.claude-opus-4.5-20251101-v1:0", + "name": "Claude Opus 4.5 (EU)", + "family": "claude-opus", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8939,30 +8994,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "family": "gpt-codex", + "id": "amazon-bedrock/eu.anthropic.claude-opus-4.6-v1", + "name": "Claude Opus 4.6 (EU)", + "family": "claude-opus", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -8970,30 +9027,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 } }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "family": "gpt-codex", + "id": "amazon-bedrock/eu.anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4 (EU)", + "family": "claude-sonnet", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9001,30 +9060,32 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "family": "gpt-codex", + "id": "amazon-bedrock/eu.anthropic.claude-sonnet-4.5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (EU)", + "family": "claude-sonnet", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9032,30 +9093,32 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 2.0, - "cache_read": 0.025 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "family": "gpt", + "id": "amazon-bedrock/eu.anthropic.claude-sonnet-4.6", + "name": "Claude Sonnet 4.6 (EU)", + "family": "claude-sonnet", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9063,30 +9126,32 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "family": "gpt-codex", + "id": "amazon-bedrock/global.anthropic.claude-haiku-4.5-20251001-v1:0", + "name": "Claude Haiku 4.5 (Global)", + "family": "claude-haiku", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9094,88 +9159,70319 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 } }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "family": "gpt-codex", + "id": "amazon-bedrock/global.anthropic.claude-opus-4.5-20251101-v1:0", + "name": "Claude Opus 4.5 (Global)", + "family": "claude-opus", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/global.anthropic.claude-opus-4.6-v1", + "name": "Claude Opus 4.6 (Global)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "amazon-bedrock/global.anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4 (Global)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/global.anthropic.claude-sonnet-4.5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (Global)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/global.anthropic.claude-sonnet-4.6", + "name": "Claude Sonnet 4.6 (Global)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/google.gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049999999999999996, + "output": 0.09999999999999999 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "amazon-bedrock/google.gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.2 + }, + "limit": { + "context": 202752, + "output": 8192 + } + }, + { + "id": "amazon-bedrock/google.gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.04, + "output": 0.08 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-1-70b-instruct-v1:0", + "name": "Llama 3.1 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.72, + "output": 0.72 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-1-8b-instruct-v1:0", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.22 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-2-11b-instruct-v1:0", + "name": "Llama 3.2 11B Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.16, + "output": 0.16 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-2-1b-instruct-v1:0", + "name": "Llama 3.2 1B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 131000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-2-3b-instruct-v1:0", + "name": "Llama 3.2 3B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 131000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-2-90b-instruct-v1:0", + "name": "Llama 3.2 90B Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.72, + "output": 0.72 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-3-70b-instruct-v1:0", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.72, + "output": 0.72 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/meta.llama3-70b-instruct-v1:0", + "name": "Llama 3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.65, + "output": 3.5 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "amazon-bedrock/meta.llama3-8b-instruct-v1:0", + "name": "Llama 3 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-03", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.6 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "amazon-bedrock/meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.24, + "output": 0.97 + }, + "limit": { + "context": 1000000, + "output": 16384 + } + }, + { + "id": "amazon-bedrock/meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.17, + "output": 0.66 + }, + "limit": { + "context": 3500000, + "output": 16384 + } + }, + { + "id": "amazon-bedrock/minimax.minimax-m2", + "name": "MiniMax M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204608, + "output": 128000 + } + }, + { + "id": "amazon-bedrock/minimax.minimax-m2.1", + "name": "MiniMax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "amazon-bedrock/mistral.ministral-3-14b-instruct", + "name": "Ministral 14B 3.0", + "family": "ministral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/mistral.ministral-3-8b-instruct", + "name": "Ministral 3 8B", + "family": "ministral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/mistral.mistral-7b-instruct-v0:2", + "name": "Mistral-7B-Instruct-v0.3", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.11 + }, + "limit": { + "context": 127000, + "output": 127000 + } + }, + { + "id": "amazon-bedrock/mistral.mistral-large-2402-v1:0", + "name": "Mistral Large (24.02)", + "family": "mistral-large", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.5 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/mistral.mixtral-8x7b-instruct-v0:1", + "name": "Mixtral-8x7B-Instruct-v0.1", + "family": "mixtral", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 0.7 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "amazon-bedrock/mistral.voxtral-mini-3b", + "name": "Voxtral Mini 3B 2507", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "audio", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.04, + "output": 0.04 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/mistral.voxtral-small-24b", + "name": "Voxtral Small 24B 2507", + "family": "mistral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.35 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "amazon-bedrock/moonshot.kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "amazon-bedrock/moonshotai.kimi-k2.5", + "name": "Kimi K2.5", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "amazon-bedrock/nvidia.nemotron-nano-12b-v2", + "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "family": "nemotron", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/nvidia.nemotron-nano-9b-v2", + "name": "NVIDIA Nemotron Nano 9B v2", + "family": "nemotron", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.06, + "output": 0.23 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/openai.gpt-oss-120b-1:0", + "name": "gpt-oss-120b", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/openai.gpt-oss-20b-1:0", + "name": "gpt-oss-20b", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/openai.gpt-oss-safeguard-120b", + "name": "GPT OSS Safeguard 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/openai.gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "amazon-bedrock/qwen.qwen3-235b-a22b-2507-v1:0", + "name": "Qwen3 235B A22B 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.88 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "amazon-bedrock/qwen.qwen3-32b-v1:0", + "name": "Qwen3 32B (dense)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "amazon-bedrock/qwen.qwen3-coder-30b-a3b-v1:0", + "name": "Qwen3 Coder 30B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "amazon-bedrock/qwen.qwen3-coder-480b-a35b-v1:0", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 1.8 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "amazon-bedrock/qwen.qwen3-next-80b-a3b", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 1.4 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "amazon-bedrock/qwen.qwen3-vl-235b-a22b", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-haiku-4.5-20251001-v1:0", + "name": "Claude Haiku 4.5 (US)", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-opus-4-20250514-v1:0", + "name": "Claude Opus 4 (US)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-opus-4.1-20250805-v1:0", + "name": "Claude Opus 4.1 (US)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-opus-4.5-20251101-v1:0", + "name": "Claude Opus 4.5 (US)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-opus-4.6-v1", + "name": "Claude Opus 4.6 (US)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4 (US)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-sonnet-4.5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (US)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/us.anthropic.claude-sonnet-4.6", + "name": "Claude Sonnet 4.6 (US)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "amazon-bedrock/writer.palmyra-x4-v1:0", + "name": "Palmyra X4", + "family": "palmyra", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 122880, + "output": 8192 + } + }, + { + "id": "amazon-bedrock/writer.palmyra-x5-v1:0", + "name": "Palmyra X5", + "family": "palmyra", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.6, + "output": 6.0 + }, + "limit": { + "context": 1040000, + "output": 8192 + } + }, + { + "id": "amazon-bedrock/zai.glm-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "amazon-bedrock/zai.glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.4 + }, + "limit": { + "context": 200000, + "output": 131072 + } + }, + { + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "anthropic/claude-3-sonnet", + "name": "Claude Sonnet 3", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04-30", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7 (latest)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "anthropic/claude-opus-4.0", + "name": "Claude Opus 4 (latest)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "anthropic/claude-sonnet-4.0", + "name": "Claude Sonnet 4 (latest)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure-cognitive-services/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure-cognitive-services/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "azure-cognitive-services/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure-cognitive-services/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure-cognitive-services/codestral", + "name": "Codestral 25.01", + "family": "codestral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "azure-cognitive-services/codex-mini", + "name": "Codex Mini", + "family": "gpt-codex-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 6.0, + "cache_read": 0.375 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure-cognitive-services/cohere-command-a", + "name": "Command A", + "family": "command-a", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 256000, + "output": 8000 + } + }, + { + "id": "azure-cognitive-services/cohere-command-r-08", + "name": "Command R", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "azure-cognitive-services/cohere-command-r-plus-08", + "name": "Command R+", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "azure-cognitive-services/cohere-embed-v-4.0", + "name": "Embed v4", + "family": "cohere-embed", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 1536 + } + }, + { + "id": "azure-cognitive-services/cohere-embed-v3-english", + "name": "Embed v3 English", + "family": "cohere-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 512, + "output": 1024 + } + }, + { + "id": "azure-cognitive-services/cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "family": "cohere-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 512, + "output": 1024 + } + }, + { + "id": "azure-cognitive-services/deepseek-r1", + "name": "DeepSeek-R1-0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.35, + "output": 5.4 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "azure-cognitive-services/deepseek-v3", + "name": "DeepSeek-V3-0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.14, + "output": 4.56 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "azure-cognitive-services/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.56, + "output": 1.68 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "azure-cognitive-services/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.58, + "output": 1.68 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.58, + "output": 1.68 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo 0125", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.5 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 2.0 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/gpt-4", + "name": "GPT-4", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 60.0, + "output": 120.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/gpt-4-32k", + "name": "GPT-4 32K", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 60.0, + "output": 120.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/gpt-4-turbo", + "name": "GPT-4 Turbo", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/gpt-4o-mini", + "name": "GPT-4o mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5-chat", + "name": "GPT-5 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/gpt-5-codex", + "name": "GPT-5-Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5-pro", + "name": "GPT-5 Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 120.0 + }, + "limit": { + "context": 400000, + "output": 272000 + } + }, + { + "id": "azure-cognitive-services/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/grok-3", + "name": "Grok 3", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/grok-3-mini", + "name": "Grok 3 Mini", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "azure-cognitive-services/grok-4-fast", + "name": "Grok 4 Fast (Reasoning)", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "azure-cognitive-services/grok-4-fast-non", + "name": "Grok 4 Fast (Non-Reasoning)", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "azure-cognitive-services/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 10000 + } + }, + { + "id": "azure-cognitive-services/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "azure-cognitive-services/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "azure-cognitive-services/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.37, + "output": 0.37 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.04, + "output": 2.04 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.71, + "output": 0.71 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.78 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/mai-ds-r1", + "name": "MAI-DS-R1", + "family": "mai", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.35, + "output": 5.4 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.68, + "output": 3.54 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "azure-cognitive-services/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.61 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "azure-cognitive-services/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 5.33, + "output": 16.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.68, + "output": 3.54 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.61 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/ministral-3b", + "name": "Ministral 3B", + "family": "ministral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.04 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure-cognitive-services/mistral-large", + "name": "Mistral Large 24.11", + "family": "mistral-large", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/mistral-medium", + "name": "Mistral Medium 3", + "family": "mistral-medium", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure-cognitive-services/mistral-small", + "name": "Mistral Small 3.1", + "family": "mistral-small", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/model-router", + "name": "Model Router", + "family": "model-router", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2025-05-19", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure-cognitive-services/o1", + "name": "o1", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure-cognitive-services/o1-mini", + "name": "o1-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "azure-cognitive-services/o1-preview", + "name": "o1-preview", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 16.5, + "output": 66.0, + "cache_read": 8.25 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure-cognitive-services/o3", + "name": "o3", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure-cognitive-services/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure-cognitive-services/o4-mini", + "name": "o4-mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure-cognitive-services/phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.17, + "output": 0.68 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.17, + "output": 0.68 + }, + "limit": { + "context": 4096, + "output": 1024 + } + }, + { + "id": "azure-cognitive-services/phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 4096, + "output": 1024 + } + }, + { + "id": "azure-cognitive-services/phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "azure-cognitive-services/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.16, + "output": 0.64 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-4", + "name": "Phi-4", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.125, + "output": 0.5 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-4-mini", + "name": "Phi-4-mini", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-4-multimodal", + "name": "Phi-4-multimodal", + "family": "phi", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.32 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.125, + "output": 0.5 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "azure-cognitive-services/text-embedding-3-large", + "name": "text-embedding-3-large", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 3072 + } + }, + { + "id": "azure-cognitive-services/text-embedding-3-small", + "name": "text-embedding-3-small", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 1536 + } + }, + { + "id": "azure-cognitive-services/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "azure/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "azure/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "azure/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "azure/codestral", + "name": "Codestral 25.01", + "family": "codestral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "azure/codex-mini", + "name": "Codex Mini", + "family": "gpt-codex-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 6.0, + "cache_read": 0.375 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure/cohere-command-a", + "name": "Command A", + "family": "command-a", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 256000, + "output": 8000 + } + }, + { + "id": "azure/cohere-command-r-08", + "name": "Command R", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "azure/cohere-command-r-plus-08", + "name": "Command R+", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "azure/cohere-embed-v-4.0", + "name": "Embed v4", + "family": "cohere-embed", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 1536 + } + }, + { + "id": "azure/cohere-embed-v3-english", + "name": "Embed v3 English", + "family": "cohere-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 512, + "output": 1024 + } + }, + { + "id": "azure/cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "family": "cohere-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 512, + "output": 1024 + } + }, + { + "id": "azure/deepseek-r1", + "name": "DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.35, + "output": 5.4 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "azure/deepseek-v3", + "name": "DeepSeek-V3-0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.14, + "output": 4.56 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "azure/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.56, + "output": 1.68 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "azure/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.58, + "output": 1.68 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure/deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.58, + "output": 1.68 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo 1106", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "azure/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 2.0 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "azure/gpt-4", + "name": "GPT-4", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 60.0, + "output": 120.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "azure/gpt-4-32k", + "name": "GPT-4 32K", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 60.0, + "output": 120.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "azure/gpt-4-turbo", + "name": "GPT-4 Turbo", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "azure/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "azure/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "azure/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure/gpt-4o-mini", + "name": "GPT-4o mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5-chat", + "name": "GPT-5 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure/gpt-5-codex", + "name": "GPT-5-Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5-pro", + "name": "GPT-5 Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 120.0 + }, + "limit": { + "context": 400000, + "output": 272000 + } + }, + { + "id": "azure/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "azure/grok-3", + "name": "Grok 3", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "azure/grok-3-mini", + "name": "Grok 3 Mini", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "azure/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "azure/grok-4-fast", + "name": "Grok 4 Fast (Reasoning)", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "azure/grok-4-fast-non", + "name": "Grok 4 Fast (Non-Reasoning)", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "azure/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 10000 + } + }, + { + "id": "azure/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "azure/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "azure/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.37, + "output": 0.37 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.04, + "output": 2.04 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.71, + "output": 0.71 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.78 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure/mai-ds-r1", + "name": "MAI-DS-R1", + "family": "mai", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.35, + "output": 5.4 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.68, + "output": 3.54 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "azure/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.61 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "azure/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 5.33, + "output": 16.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.68, + "output": 3.54 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.61 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/ministral-3b", + "name": "Ministral 3B", + "family": "ministral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.04 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "azure/mistral-large", + "name": "Mistral Large 24.11", + "family": "mistral-large", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/mistral-medium", + "name": "Mistral Medium 3", + "family": "mistral-medium", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "azure/mistral-small", + "name": "Mistral Small 3.1", + "family": "mistral-small", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/model-router", + "name": "Model Router", + "family": "model-router", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2025-05-19", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "azure/o1", + "name": "o1", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure/o1-mini", + "name": "o1-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "azure/o1-preview", + "name": "o1-preview", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 16.5, + "output": 66.0, + "cache_read": 8.25 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "azure/o3", + "name": "o3", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure/o4-mini", + "name": "o4-mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "azure/phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.17, + "output": 0.68 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.17, + "output": 0.68 + }, + "limit": { + "context": 4096, + "output": 1024 + } + }, + { + "id": "azure/phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 4096, + "output": 1024 + } + }, + { + "id": "azure/phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "azure/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.16, + "output": 0.64 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-4", + "name": "Phi-4-reasoning", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.125, + "output": 0.5 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "azure/phi-4-mini", + "name": "Phi-4-mini-reasoning", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-4-multimodal", + "name": "Phi-4-multimodal", + "family": "phi", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.32 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "azure/phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.125, + "output": 0.5 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "azure/text-embedding-3-large", + "name": "text-embedding-3-large", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 3072 + } + }, + { + "id": "azure/text-embedding-3-small", + "name": "text-embedding-3-small", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 1536 + } + }, + { + "id": "azure/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "bailing/Ling-1T", + "name": "Ling-1T", + "family": "ling", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.57, + "output": 2.29 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "bailing/Ring-1T", + "name": "Ring-1T", + "family": "ring", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.57, + "output": 2.29 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "baseten/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.38, + "output": 1.53 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "baseten/deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.45 + }, + "limit": { + "context": 163800, + "output": 131100 + } + }, + { + "id": "baseten/moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2 Instruct 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "baseten/moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "baseten/moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-30", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 8192 + } + }, + { + "id": "baseten/zai-org/GLM-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "baseten/zai-org/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "baseten/zai-org/GLM-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.95, + "output": 3.15 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "berget/BAAI/bge-reranker-v2-m3", + "name": "bge-reranker-v2-m3", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-04", + "release_date": "2025-04-23", + "last_updated": "2025-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 512, + "output": 512 + } + }, + { + "id": "berget/KBLab/kb-whisper-large", + "name": "KB-Whisper-Large", + "family": "whisper", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-04", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 3.0, + "output": 3.0 + }, + "limit": { + "context": 480000, + "output": 4800 + } + }, + { + "id": "berget/intfloat/multilingual-e5-large", + "name": "Multilingual-E5-large", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-09", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 512, + "output": 1024 + } + }, + { + "id": "berget/intfloat/multilingual-e5-large-instruct", + "name": "Multilingual-E5-large-instruct", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-04", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 512, + "output": 1024 + } + }, + { + "id": "berget/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.9, + "output": 0.9 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "berget/mistralai/Mistral-Small-3.2-24B-Instruct", + "name": "Mistral Small 3.2 24B Instruct 2506", + "family": "mistral-small", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.3 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "berget/openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "berget/zai-org/GLM-4.7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.3 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "cerebras/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.69 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "cerebras/llama3.1-8b", + "name": "Llama 3.1 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 32000, + "output": 8000 + } + }, + { + "id": "cerebras/qwen-3-235b-a22b-instruct", + "name": "Qwen 3 235B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.2 + }, + "limit": { + "context": 131000, + "output": 32000 + } + }, + { + "id": "cerebras/zai-glm-4.7", + "name": "Z.AI GLM-4.7", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.25, + "output": 2.75, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 131072, + "output": 40000 + } + }, + { + "id": "chutes/MiniMaxAI/MiniMax-M2.1-TEE", + "name": "MiniMax M2.1 TEE", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.12 + }, + "limit": { + "context": 196608, + "output": 65536 + } + }, + { + "id": "chutes/MiniMaxAI/MiniMax-M2.5-TEE", + "name": "MiniMax M2.5 TEE", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 196608, + "output": 65536 + } + }, + { + "id": "chutes/NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes 3 Mistral 24B Preview", + "family": "nousresearch", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.1 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "chutes/NousResearch/Hermes-4-14B", + "name": "Hermes 4 14B", + "family": "nousresearch", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.05 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "chutes/NousResearch/Hermes-4-405B-FP8-TEE", + "name": "Hermes 4 405B FP8 TEE", + "family": "nousresearch", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "chutes/NousResearch/Hermes-4-70B", + "name": "Hermes 4 70B", + "family": "nousresearch", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.38 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/NousResearch/Hermes-4.3-36B", + "name": "Hermes 4.3 36B", + "family": "nousresearch", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.39 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "chutes/OpenGVLab/InternVL3-78B-TEE", + "name": "InternVL3 78B TEE", + "family": "opengvlab", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-06", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.39 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "chutes/Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen2.5 72B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "chutes/Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "chutes/Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "chutes/Qwen/Qwen2.5-VL-72B-Instruct-TEE", + "name": "Qwen2.5 VL 72B Instruct TEE", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "chutes/Qwen/Qwen3-14B", + "name": "Qwen3 14B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "chutes/Qwen/Qwen3-235B-A22B", + "name": "Qwen3 235B A22B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "chutes/Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", + "name": "Qwen3 235B A22B Instruct 2507 TEE", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.55, + "cache_read": 0.04 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "chutes/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/Qwen/Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.22 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "chutes/Qwen/Qwen3-30B-A3B-Instruct", + "name": "Qwen3 30B A3B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.33 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "chutes/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE", + "name": "Qwen3 Coder 480B A35B Instruct FP8 TEE", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.95, + "cache_read": 0.11 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/Qwen/Qwen3-Coder-Next", + "name": "Qwen3 Coder Next", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.3 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "chutes/Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.8 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/Qwen/Qwen3.5-397B-A17B-TEE", + "name": "Qwen3.5 397B A17B TEE", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-18", + "last_updated": "2026-02-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "chutes/Qwen/Qwen3Guard-Gen-0.6B", + "name": "Qwen3Guard Gen 0.6B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.01, + "cache_read": 0.005 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "chutes/XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo V2 Flash", + "family": "mimo", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.29 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "chutes/chutesai/Mistral-Small-3.1-24B-Instruct", + "name": "Mistral Small 3.1 24B Instruct 2503", + "family": "chutesai", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11, + "cache_read": 0.015 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/chutesai/Mistral-Small-3.2-24B-Instruct", + "name": "Mistral Small 3.2 24B Instruct 2506", + "family": "chutesai", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.18 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-R1-0528-TEE", + "name": "DeepSeek R1 0528 TEE", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.75 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-R1-TEE", + "name": "DeepSeek R1 TEE", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-V3-0324-TEE", + "name": "DeepSeek V3 0324 TEE", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.19, + "output": 0.87, + "cache_read": 0.095 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-V3.1-TEE", + "name": "DeepSeek V3.1 TEE", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-V3.1-Terminus-TEE", + "name": "DeepSeek V3.1 Terminus TEE", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.23, + "output": 0.9 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-V3.2-Speciale-TEE", + "name": "DeepSeek V3.2 Speciale TEE", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.41 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/deepseek-ai/DeepSeek-V3.2-TEE", + "name": "DeepSeek V3.2 TEE", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.38, + "cache_read": 0.125 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/miromind-ai/MiroThinker-v1.5-235B", + "name": "MiroThinker V1.5 235B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 8192 + } + }, + { + "id": "chutes/mistralai/Devstral-2-123B-Instruct-2512-TEE", + "name": "Devstral 2 123B Instruct 2512 TEE", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "chutes/moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2 Instruct 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.39, + "output": 1.9, + "cache_read": 0.195 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/moonshotai/Kimi-K2-Thinking-TEE", + "name": "Kimi K2 Thinking TEE", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.75 + }, + "limit": { + "context": 262144, + "output": 65535 + } + }, + { + "id": "chutes/moonshotai/Kimi-K2.5-TEE", + "name": "Kimi K2.5 TEE", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 65535 + } + }, + { + "id": "chutes/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", + "name": "NVIDIA Nemotron 3 Nano 30B A3B BF16", + "family": "nemotron", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.24 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "chutes/openai/gpt-oss-120b-TEE", + "name": "gpt oss 120b TEE", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.18 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "chutes/openai/gpt-oss-20b", + "name": "gpt oss 20b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.1 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/rednote-hilab/dots.ocr", + "name": "dots.ocr", + "family": "rednote", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.01, + "cache_read": 0.005 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/tngtech/DeepSeek-R1T-Chimera", + "name": "DeepSeek R1T Chimera", + "family": "tngtech", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "chutes/tngtech/DeepSeek-TNG-R1T2-Chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "family": "tngtech", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.85 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "chutes/tngtech/TNG-R1T-Chimera-TEE", + "name": "TNG R1T Chimera TEE", + "family": "tngtech", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.85 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/tngtech/TNG-R1T-Chimera-Turbo", + "name": "TNG R1T Chimera Turbo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.6 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "chutes/unsloth/Llama-3.2-1B-Instruct", + "name": "Llama 3.2 1B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.01, + "cache_read": 0.005 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "chutes/unsloth/Llama-3.2-3B-Instruct", + "name": "Llama 3.2 3B Instruct", + "family": "unsloth", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-02-12", + "last_updated": "2025-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.01, + "cache_read": 0.005 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "chutes/unsloth/Mistral-Nemo-Instruct", + "name": "Mistral Nemo Instruct 2407", + "family": "unsloth", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.04, + "cache_read": 0.01 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/unsloth/Mistral-Small-24B-Instruct", + "name": "Mistral Small 24B Instruct 2501", + "family": "unsloth", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "chutes/unsloth/gemma-3-12b-it", + "name": "gemma 3 12b it", + "family": "unsloth", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.1 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/unsloth/gemma-3-27b-it", + "name": "gemma 3 27b it", + "family": "unsloth", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.15, + "cache_read": 0.02 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "chutes/unsloth/gemma-3-4b-it", + "name": "gemma 3 4b it", + "family": "unsloth", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.03 + }, + "limit": { + "context": 96000, + "output": 96000 + } + }, + { + "id": "chutes/zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "chutes/zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "chutes/zai-org/GLM-4.5-TEE", + "name": "GLM 4.5 TEE", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.55 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "chutes/zai-org/GLM-4.6-FP8", + "name": "GLM 4.6 FP8", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 202752, + "output": 65535 + } + }, + { + "id": "chutes/zai-org/GLM-4.6-TEE", + "name": "GLM 4.6 TEE", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.5 + }, + "limit": { + "context": 202752, + "output": 65536 + } + }, + { + "id": "chutes/zai-org/GLM-4.6V", + "name": "GLM 4.6V", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "chutes/zai-org/GLM-4.7-FP8", + "name": "GLM 4.7 FP8", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 202752, + "output": 65535 + } + }, + { + "id": "chutes/zai-org/GLM-4.7-Flash", + "name": "GLM 4.7 Flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.35 + }, + "limit": { + "context": 202752, + "output": 65535 + } + }, + { + "id": "chutes/zai-org/GLM-4.7-TEE", + "name": "GLM 4.7 TEE", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.5 + }, + "limit": { + "context": 202752, + "output": 65535 + } + }, + { + "id": "chutes/zai-org/GLM-5-TEE", + "name": "GLM 5 TEE", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 2.5 + }, + "limit": { + "context": 202752, + "output": 65535 + } + }, + { + "id": "cloudferro-sherlock/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-09", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.92, + "output": 2.92 + }, + "limit": { + "context": 70000, + "output": 70000 + } + }, + { + "id": "cloudferro-sherlock/openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.92, + "output": 2.92 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "cloudferro-sherlock/speakleash/Bielik-11B-v2.6-Instruct", + "name": "Bielik 11B v2.6 Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.67, + "output": 0.67 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "cloudferro-sherlock/speakleash/Bielik-11B-v3.0-Instruct", + "name": "Bielik 11B v3.0 Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.67, + "output": 0.67 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-3-opus", + "name": "Claude Opus 3", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-3-sonnet", + "name": "Claude Sonnet 3", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5 (latest)", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1 (latest)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5 (latest)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6 (latest)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5 (latest)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "cloudflare-ai-gateway/anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + }, + "limit": { + "context": 16385, + "output": 4096 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-4", + "name": "GPT-4", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 30.0, + "output": 60.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-4o-mini", + "name": "GPT-4o mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/o1", + "name": "o1", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/o3", + "name": "o3", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/o3-pro", + "name": "o3-pro", + "family": "o-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 20.0, + "output": 80.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "cloudflare-ai-gateway/openai/o4-mini", + "name": "o4-mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/ai4bharat/indictrans2-en-indic-1B", + "name": "IndicTrans2 EN-Indic 1B", + "family": "indictrans", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.34, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/aisingapore/gemma-sea-lion-v4-27b-it", + "name": "Gemma SEA-LION v4 27B IT", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.56 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/baai/bge-base-en-v1.5", + "name": "BGE Base EN v1.5", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.067, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/baai/bge-large-en-v1.5", + "name": "BGE Large EN v1.5", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/baai/bge-m3", + "name": "BGE M3", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.012, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/baai/bge-reranker-base", + "name": "BGE Reranker Base", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-09", + "last_updated": "2025-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0031, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/baai/bge-small-en-v1.5", + "name": "BGE Small EN v1.5", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/deepgram/aura-2-en", + "name": "Deepgram Aura 2 (EN)", + "family": "aura", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/deepgram/aura-2-es", + "name": "Deepgram Aura 2 (ES)", + "family": "aura", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/deepgram/nova-3", + "name": "Deepgram Nova 3", + "family": "nova", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 4.88 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/facebook/bart-large-cnn", + "name": "BART Large CNN", + "family": "bart", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-09", + "last_updated": "2025-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/google/gemma-3-12b-it", + "name": "Gemma 3 12B IT", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.56 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/huggingface/distilbert-sst-2-int8", + "name": "DistilBERT SST-2 INT8", + "family": "distilbert", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.026, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/ibm-granite/granite-4.0-h-micro", + "name": "IBM Granite 4.0 H Micro", + "family": "granite", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.017, + "output": 0.11 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-2-7b-chat-fp16", + "name": "Llama 2 7B Chat FP16", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.56, + "output": 6.67 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.83 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3-8b-instruct-awq", + "name": "Llama 3 8B Instruct AWQ", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.12, + "output": 0.27 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.8299999999999998 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.1-8b-instruct-awq", + "name": "Llama 3.1 8B Instruct AWQ", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.12, + "output": 0.27 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.1-8b-instruct-fp8", + "name": "Llama 3.1 8B Instruct FP8", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.29 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049, + "output": 0.68 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.027, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.051, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-3.3-70b-instruct-fp8-fast", + "name": "Llama 3.3 70B Instruct FP8 Fast", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 2.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.85 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.48, + "output": 0.03 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/meta/m2m100-1.2b", + "name": "M2M100 1.2B", + "family": "m2m", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.34, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/mistral/mistral-7b-instruct-v0.1", + "name": "Mistral 7B Instruct v0.1", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.11, + "output": 0.19 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral Small 3.1 24B Instruct", + "family": "mistral-small", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.56 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/myshell-ai/melotts", + "name": "MyShell MeloTTS", + "family": "melotts", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.75 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/pfnet/plamo-embedding-1b", + "name": "PLaMo Embedding 1B", + "family": "plamo", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.019, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/pipecat-ai/smart-turn-v2", + "name": "Pipecat Smart Turn v2", + "family": "smart-turn", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen 2.5 Coder 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.66, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B FP8", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.051, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/qwen/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.012, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-ai-gateway/workers-ai/@cf/qwen/qwq-32b", + "name": "QwQ 32B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.66, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/ai4bharat/indictrans2-en-indic-1B", + "name": "IndicTrans2 EN-Indic 1B", + "family": "indictrans", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.34, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/aisingapore/gemma-sea-lion-v4-27b-it", + "name": "Gemma SEA-LION v4 27B IT", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.56 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/baai/bge-base-en-v1.5", + "name": "BGE Base EN v1.5", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.067, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/baai/bge-large-en-v1.5", + "name": "BGE Large EN v1.5", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/baai/bge-m3", + "name": "BGE M3", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.012, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/baai/bge-reranker-base", + "name": "BGE Reranker Base", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-09", + "last_updated": "2025-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0031, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/baai/bge-small-en-v1.5", + "name": "BGE Small EN v1.5", + "family": "bge", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/deepgram/aura-2-en", + "name": "Deepgram Aura 2 (EN)", + "family": "aura", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/deepgram/aura-2-es", + "name": "Deepgram Aura 2 (ES)", + "family": "aura", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/deepgram/nova-3", + "name": "Deepgram Nova 3", + "family": "nova", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 4.88 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/facebook/bart-large-cnn", + "name": "BART Large CNN", + "family": "bart", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-09", + "last_updated": "2025-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/google/gemma-3-12b-it", + "name": "Gemma 3 12B IT", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.56 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/huggingface/distilbert-sst-2-int8", + "name": "DistilBERT SST-2 INT8", + "family": "distilbert", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.026, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/ibm-granite/granite-4.0-h-micro", + "name": "IBM Granite 4.0 H Micro", + "family": "granite", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.017, + "output": 0.11 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-2-7b-chat-fp16", + "name": "Llama 2 7B Chat FP16", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.56, + "output": 6.67 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.83 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3-8b-instruct-awq", + "name": "Llama 3 8B Instruct AWQ", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.12, + "output": 0.27 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.8299999999999998 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.1-8b-instruct-awq", + "name": "Llama 3.1 8B Instruct AWQ", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.12, + "output": 0.27 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.1-8b-instruct-fp8", + "name": "Llama 3.1 8B Instruct FP8", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.29 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049, + "output": 0.68 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.027, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.051, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-3.3-70b-instruct-fp8-fast", + "name": "Llama 3.3 70B Instruct FP8 Fast", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 2.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.85 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.48, + "output": 0.03 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/meta/m2m100-1.2b", + "name": "M2M100 1.2B", + "family": "m2m", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.34, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/mistral/mistral-7b-instruct-v0.1", + "name": "Mistral 7B Instruct v0.1", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.11, + "output": 0.19 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral Small 3.1 24B Instruct", + "family": "mistral-small", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.56 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/myshell-ai/melotts", + "name": "MyShell MeloTTS", + "family": "melotts", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 0.75 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/pfnet/plamo-embedding-1b", + "name": "PLaMo Embedding 1B", + "family": "plamo", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.019, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/pipecat-ai/smart-turn-v2", + "name": "Pipecat Smart Turn v2", + "family": "smart-turn", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen 2.5 Coder 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.66, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B FP8", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.051, + "output": 0.34 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/qwen/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.012, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cloudflare-workers-ai/@cf/qwen/qwq-32b", + "name": "QwQ 32B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.66, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "cohere/c4ai-aya-expanse-32b", + "name": "Aya Expanse 32B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "cohere/c4ai-aya-expanse-8b", + "name": "Aya Expanse 8B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 8000, + "output": 4000 + } + }, + { + "id": "cohere/c4ai-aya-vision-32b", + "name": "Aya Vision 32B", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 16000, + "output": 4000 + } + }, + { + "id": "cohere/c4ai-aya-vision-8b", + "name": "Aya Vision 8B", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 16000, + "output": 4000 + } + }, + { + "id": "cohere/command-a-03", + "name": "Command A", + "family": "command-a", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 256000, + "output": 8000 + } + }, + { + "id": "cohere/command-a-reasoning-08", + "name": "Command A Reasoning", + "family": "command-a", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "cohere/command-a-translate-08", + "name": "Command A Translate", + "family": "command-a", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 8000, + "output": 8000 + } + }, + { + "id": "cohere/command-a-vision-07", + "name": "Command A Vision", + "family": "command-a", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 128000, + "output": 8000 + } + }, + { + "id": "cohere/command-r-08", + "name": "Command R", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "cohere/command-r-plus-08", + "name": "Command R+", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "cohere/command-r7b-12", + "name": "Command R7B", + "family": "command-r", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0375, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "cohere/command-r7b-arabic-02", + "name": "Command R7B Arabic", + "family": "command-r", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0375, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "cortecs/claude-4.5-sonnet", + "name": "Claude 4.5 Sonnet", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.259, + "output": 16.296 + }, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "cortecs/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.307, + "output": 16.536 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "cortecs/deepseek-v3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.551, + "output": 1.654 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "cortecs/devstral", + "name": "Devstral 2 2512", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "cortecs/devstral-small", + "name": "Devstral Small 2 2512", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "cortecs/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.654, + "output": 11.024 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "cortecs/glm-4p5", + "name": "GLM 4.5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.67, + "output": 2.46 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "cortecs/glm-4p5-air", + "name": "GLM 4.5 Air", + "family": "glm-air", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 1.34 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "cortecs/glm-4p7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.45, + "output": 2.23 + }, + "limit": { + "context": 198000, + "output": 198000 + } + }, + { + "id": "cortecs/gpt-4.1", + "name": "GPT 4.1", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.354, + "output": 9.417 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "cortecs/gpt-oss-120b", + "name": "GPT Oss 120b", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "cortecs/intellect-3", + "name": "INTELLECT 3", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.219, + "output": 1.202 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "cortecs/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-07-11", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.551, + "output": 2.646 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "cortecs/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.656, + "output": 2.731 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "cortecs/llama-3.1-405b-instruct", + "name": "Llama 3.1 405B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "cortecs/minimax-m2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.39, + "output": 1.57 + }, + "limit": { + "context": 400000, + "output": 400000 + } + }, + { + "id": "cortecs/minimax-m2p1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.34, + "output": 1.34 + }, + "limit": { + "context": 196000, + "output": 196000 + } + }, + { + "id": "cortecs/nova-pro-v1", + "name": "Nova Pro 1.0", + "family": "nova-pro", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.016, + "output": 4.061 + }, + "limit": { + "context": 300000, + "output": 5000 + } + }, + { + "id": "cortecs/qwen3-32b", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.099, + "output": 0.33 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "cortecs/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.441, + "output": 1.984 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "cortecs/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.164, + "output": 1.311 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "deepinfra/MiniMaxAI/MiniMax-M2", + "name": "MiniMax M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.254, + "output": 1.02 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "deepinfra/MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.2 + }, + "limit": { + "context": 196608, + "output": 196608 + } + }, + { + "id": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.6 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "deepinfra/anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7 (Latest)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-31", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "deepinfra/anthropic/claude-4-opus", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 16.5, + "output": 82.5 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "deepinfra/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek-R1-0528", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.15, + "cache_read": 0.35 + }, + "limit": { + "context": 163840, + "output": 64000 + } + }, + { + "id": "deepinfra/deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.26, + "output": 0.38, + "cache_read": 0.13 + }, + "limit": { + "context": 163840, + "output": 64000 + } + }, + { + "id": "deepinfra/moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "deepinfra/moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-11-06", + "last_updated": "2025-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.47, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "deepinfra/moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 2.8 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "deepinfra/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.24 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "deepinfra/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.14 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "deepinfra/zai-org/GLM-4.5", + "name": "GLM-4.5", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "deepinfra/zai-org/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 + }, + "limit": { + "context": 202752, + "output": 16384 + } + }, + { + "id": "deepinfra/zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "family": "glm-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.4 + }, + "limit": { + "context": 202752, + "output": 16384 + } + }, + { + "id": "deepseek/deepseek-chat", + "name": "DeepSeek Chat", + "family": "deepseek", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.42, + "cache_read": 0.028 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "deepseek/deepseek-reasoner", + "name": "DeepSeek Reasoner", + "family": "deepseek-thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.42, + "cache_read": 0.028 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "evroc/KBLab/kb-whisper-large", + "name": "KB Whisper", + "family": "whisper", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.00236, + "output": 0.00236 + }, + "limit": { + "context": 448, + "output": 448 + } + }, + { + "id": "evroc/Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", + "name": "Qwen3 30B 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.42 + }, + "limit": { + "context": 64000, + "output": 64000 + } + }, + { + "id": "evroc/Qwen/Qwen3-Embedding-8B", + "name": "Qwen3 Embedding 8B", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.12 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "evroc/Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3 VL 30B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.24, + "output": 0.94 + }, + "limit": { + "context": 100000, + "output": 100000 + } + }, + { + "id": "evroc/intfloat/multilingual-e5-large-instruct", + "name": "E5 Multi-Lingual Large Embeddings 0.6B", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.12 + }, + "limit": { + "context": 512, + "output": 512 + } + }, + { + "id": "evroc/microsoft/Phi-4-multimodal-instruct", + "name": "Phi-4 15B", + "family": "phi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.24, + "output": 0.47 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "evroc/mistralai/Magistral-Small", + "name": "Magistral Small 1.2 24B", + "family": "magistral-small", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.59, + "output": 2.36 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "evroc/mistralai/Voxtral-Small-24B", + "name": "Voxtral Small 24B", + "family": "voxtral", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "modalities": { + "input": [ + "audio", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.00236, + "output": 0.00236 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "evroc/mistralai/devstral-small-2-24b-instruct", + "name": "Devstral Small 2 24B Instruct 2512", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.47 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "evroc/moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.47, + "output": 5.9 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "evroc/nvidia/Llama-3.3-70B-Instruct-FP8", + "name": "Llama 3.3 70B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.18, + "output": 1.18 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "evroc/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.24, + "output": 0.94 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "evroc/openai/whisper-large-v3", + "name": "Whisper 3 Large", + "family": "whisper", + "attachment": false, + "reasoning": false, + "tool_call": false, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.00236, + "output": 0.00236 + }, + "limit": { + "context": 448, + "output": 4096 + } + }, + { + "id": "fastrouter/anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "fastrouter/anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "fastrouter/deepseek-ai/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.14 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "fastrouter/google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "fastrouter/google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "fastrouter/moonshotai/kimi-k2", + "name": "Kimi K2", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.2 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "fastrouter/openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "fastrouter/openai/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "fastrouter/openai/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "fastrouter/openai/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "fastrouter/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "fastrouter/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.2 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "fastrouter/qwen/qwen3-coder", + "name": "Qwen3 Coder", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "fastrouter/x-ai/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75, + "cache_write": 15.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/deepseek-v3p1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.56, + "output": 1.68 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/deepseek-v3p2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.28 + }, + "limit": { + "context": 160000, + "output": 160000 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/glm-4p5", + "name": "GLM 4.5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/glm-4p5-air", + "name": "GLM 4.5 Air", + "family": "glm-air", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.88 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/glm-4p7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.3 + }, + "limit": { + "context": 198000, + "output": 198000 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/glm-5", + "name": "GLM 5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.5 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.2 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.3 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/kimi-k2p5", + "name": "Kimi K2.5", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.1 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/minimax-m2p1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "fireworks-ai/accounts/fireworks/models/minimax-m2p5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 196608, + "output": 196608 + } + }, + { + "id": "firmware/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "firmware/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "firmware/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "firmware/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "firmware/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2026-02-17", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "firmware/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "firmware/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "firmware/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "firmware/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "firmware/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "firmware/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "firmware/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "firmware/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "firmware/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "firmware/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "firmware/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.2 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "friendli/LGAI-EXAONE/EXAONE-4.0.1-32B", + "name": "EXAONE 4.0.1 32B", + "family": "exaone", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-31", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "friendli/LGAI-EXAONE/K-EXAONE-236B-A23B", + "name": "K EXAONE 236B A23B", + "family": "exaone", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-31", + "last_updated": "2026-01-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "friendli/MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-13", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 196608, + "output": 196608 + } + }, + { + "id": "friendli/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-29", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "friendli/meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 131072, + "output": 8000 + } + }, + { + "id": "friendli/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "friendli/zai-org/GLM-4.7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-22", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 202752, + "output": 202752 + } + }, + { + "id": "friendli/zai-org/GLM-5", + "name": "GLM 5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2 + }, + "limit": { + "context": 202752, + "output": 202752 + } + }, + { + "id": "github-copilot/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "github-copilot/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "github-copilot/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/claude-opus-41", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 80000, + "output": 16000 + } + }, + { + "id": "github-copilot/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16000 + } + }, + { + "id": "github-copilot/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "github-copilot/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "github-copilot/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 64000, + "output": 16384 + } + }, + { + "id": "github-copilot/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 64000, + "output": 16384 + } + }, + { + "id": "github-copilot/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "github-copilot/gpt-5-mini", + "name": "GPT-5-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "github-copilot/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-max", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "github-copilot/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-mini", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "github-copilot/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-copilot/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 272000, + "output": 128000 + } + }, + { + "id": "github-copilot/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-27", + "last_updated": "2025-08-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "github-models/ai21-labs/ai21-jamba-1.5-large", + "name": "AI21 Jamba 1.5 Large", + "family": "jamba", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 4096 + } + }, + { + "id": "github-models/ai21-labs/ai21-jamba-1.5-mini", + "name": "AI21 Jamba 1.5 Mini", + "family": "jamba", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 4096 + } + }, + { + "id": "github-models/cohere/cohere-command-a", + "name": "Cohere Command A", + "family": "command-a", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/cohere/cohere-command-r", + "name": "Cohere Command R", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-03-11", + "last_updated": "2024-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/cohere/cohere-command-r-08", + "name": "Cohere Command R 08-2024", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/cohere/cohere-command-r-plus", + "name": "Cohere Command R+", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-04-04", + "last_updated": "2024-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/cohere/cohere-command-r-plus-08", + "name": "Cohere Command R+ 08-2024", + "family": "command-r", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/core42/jais-30b-chat", + "name": "JAIS 30b Chat", + "family": "jais", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-03", + "release_date": "2023-08-30", + "last_updated": "2023-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "github-models/deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 65536, + "output": 8192 + } + }, + { + "id": "github-models/deepseek/deepseek-v3", + "name": "DeepSeek-V3-0324", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/meta/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/meta/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/meta/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/meta/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "github-models/meta/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "github-models/meta/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/meta/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/meta/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/microsoft/mai-ds-r1", + "name": "MAI-DS-R1", + "family": "mai", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 65536, + "output": 8192 + } + }, + { + "id": "github-models/microsoft/phi-3-medium-128k-instruct", + "name": "Phi-3-medium instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-3-medium-4k-instruct", + "name": "Phi-3-medium instruct (4k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 4096, + "output": 1024 + } + }, + { + "id": "github-models/microsoft/phi-3-mini-128k-instruct", + "name": "Phi-3-mini instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-3-mini-4k-instruct", + "name": "Phi-3-mini instruct (4k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 4096, + "output": 1024 + } + }, + { + "id": "github-models/microsoft/phi-3-small-128k-instruct", + "name": "Phi-3-small instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-3-small-8k-instruct", + "name": "Phi-3-small instruct (8k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "github-models/microsoft/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-3.5-vision-instruct", + "name": "Phi-3.5-vision instruct (128k)", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-4", + "name": "Phi-4-Reasoning", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-4-mini", + "name": "Phi-4-mini-reasoning", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/microsoft/phi-4-multimodal-instruct", + "name": "Phi-4-multimodal-instruct", + "family": "phi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "github-models/mistral-ai/codestral", + "name": "Codestral 25.01", + "family": "codestral", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "github-models/mistral-ai/ministral-3b", + "name": "Ministral 3B", + "family": "ministral", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/mistral-ai/mistral-large", + "name": "Mistral Large 24.11", + "family": "mistral-large", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/mistral-ai/mistral-medium", + "name": "Mistral Medium 3 (25.05)", + "family": "mistral-medium", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/mistral-ai/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/mistral-ai/mistral-small", + "name": "Mistral Small 3.1", + "family": "mistral-small", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "github-models/openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "github-models/openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "github-models/openai/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "github-models/openai/gpt-4o-mini", + "name": "GPT-4o mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "github-models/openai/o1", + "name": "OpenAI o1", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "github-models/openai/o1-mini", + "name": "OpenAI o1-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "github-models/openai/o1-preview", + "name": "OpenAI o1-preview", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "github-models/openai/o3", + "name": "OpenAI o3", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "github-models/openai/o3-mini", + "name": "OpenAI o3-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "github-models/openai/o4-mini", + "name": "OpenAI o4-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "github-models/xai/grok-3", + "name": "Grok 3", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "github-models/xai/grok-3-mini", + "name": "Grok 3 Mini", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "gitlab/duo-chat-gpt-5-codex", + "name": "Agentic Chat (GPT-5 Codex)", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "gitlab/duo-chat-gpt-5-mini", + "name": "Agentic Chat (GPT-5 Mini)", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "gitlab/duo-chat-gpt-5.1", + "name": "Agentic Chat (GPT-5.1)", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "gitlab/duo-chat-gpt-5.2", + "name": "Agentic Chat (GPT-5.2)", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "gitlab/duo-chat-gpt-5.2-codex", + "name": "Agentic Chat (GPT-5.2 Codex)", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "gitlab/duo-chat-haiku-4.5", + "name": "Agentic Chat (Claude Haiku 4.5)", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "gitlab/duo-chat-opus-4.5", + "name": "Agentic Chat (Claude Opus 4.5)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "gitlab/duo-chat-opus-4.6", + "name": "Agentic Chat (Claude Opus 4.6)", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "gitlab/duo-chat-sonnet-4.5", + "name": "Agentic Chat (Claude Sonnet 4.5)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "gitlab/duo-chat-sonnet-4.6", + "name": "Agentic Chat (Claude Sonnet 4.6)", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex-anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "google-vertex-anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "google-vertex-anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex-anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex-anthropic/claude-opus-4", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "google-vertex-anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "google-vertex-anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex-anthropic/claude-opus-4.6@default", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "google-vertex-anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex-anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex-anthropic/claude-sonnet-4.6@default", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "google-vertex/deepseek-ai/deepseek-v3.1-maas", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.7 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "google-vertex/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "google-vertex/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "google-vertex/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-flash-lite-preview-09", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-flash-preview-09", + "name": "Gemini 2.5 Flash Preview 09-25", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-embedding-001", + "name": "Gemini Embedding 001", + "family": "gemini", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.0 + }, + "limit": { + "context": 2048, + "output": 3072 + } + }, + { + "id": "google-vertex/gemini-flash", + "name": "Gemini Flash Latest", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/gemini-flash-lite", + "name": "Gemini Flash-Lite Latest", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google-vertex/meta/llama-3.3-70b-instruct-maas", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.72, + "output": 0.72 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "google-vertex/meta/llama-4-maverick-17b-128e-instruct-maas", + "name": "Llama 4 Maverick 17B 128E Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.15 + }, + "limit": { + "context": 524288, + "output": 8192 + } + }, + { + "id": "google-vertex/openai/gpt-oss-120b-maas", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.36 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "google-vertex/openai/gpt-oss-20b-maas", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.25 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "google-vertex/qwen/qwen3-235b-a22b-instruct-2507-maas", + "name": "Qwen3 235B A22B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-13", + "last_updated": "2025-08-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.88 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "google-vertex/zai-org/glm-4.7-maas", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-01-06", + "last_updated": "2026-01-06", + "modalities": { + "input": [ + "text", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "google-vertex/zai-org/glm-5-maas", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.1 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "google/gemini-1.5-flash", + "name": "Gemini 1.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3, + "cache_read": 0.01875 + }, + "limit": { + "context": 1000000, + "output": 8192 + } + }, + { + "id": "google/gemini-1.5-flash-8b", + "name": "Gemini 1.5 Flash-8B", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-10-03", + "last_updated": "2024-10-03", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0375, + "output": 0.15, + "cache_read": 0.01 + }, + "limit": { + "context": 1000000, + "output": 8192 + } + }, + { + "id": "google/gemini-1.5-pro", + "name": "Gemini 1.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-02-15", + "last_updated": "2024-02-15", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 5.0, + "cache_read": 0.3125 + }, + "limit": { + "context": 1000000, + "output": 8192 + } + }, + { + "id": "google/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 30.0, + "cache_read": 0.075 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "google/gemini-2.5-flash-image-preview", + "name": "Gemini 2.5 Flash Image (Preview)", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 30.0, + "cache_read": 0.075 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-lite-preview-09", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-preview-09", + "name": "Gemini 2.5 Flash Preview 09-25", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-flash-preview-tts", + "name": "Gemini 2.5 Flash Preview TTS", + "family": "gemini-flash", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 10.0 + }, + "limit": { + "context": 8000, + "output": 16000 + } + }, + { + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-2.5-pro-preview-tts", + "name": "Gemini 2.5 Pro Preview TTS", + "family": "gemini-flash", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 20.0 + }, + "limit": { + "context": 8000, + "output": 16000 + } + }, + { + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-embedding-001", + "name": "Gemini Embedding 001", + "family": "gemini", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.0 + }, + "limit": { + "context": 2048, + "output": 3072 + } + }, + { + "id": "google/gemini-flash", + "name": "Gemini Flash Latest", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-flash-lite", + "name": "Gemini Flash-Lite Latest", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "google/gemini-live-2.5-flash", + "name": "Gemini Live 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8000 + } + }, + { + "id": "google/gemini-live-2.5-flash-preview-native-audio", + "name": "Gemini Live 2.5 Flash Preview Native Audio", + "family": "gemini-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-09-18", + "modalities": { + "input": [ + "text", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "groq/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 0.99 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "groq/gemma2-9b-it", + "name": "Gemma 2 9B", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "groq/llama-3.1-8b-instant", + "name": "Llama 3.1 8B Instant", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.08 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "groq/llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.59, + "output": 0.79 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "groq/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "groq/llama3-70b", + "name": "Llama 3 70B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.59, + "output": 0.79 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "groq/llama3-8b", + "name": "Llama 3 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.08 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "groq/meta-llama/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "groq/meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.34 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "groq/meta-llama/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 131072, + "output": 1024 + } + }, + { + "id": "groq/mistral-saba-24b", + "name": "Mistral Saba 24B", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-02-06", + "last_updated": "2025-02-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.79, + "output": 0.79 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "groq/moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "groq/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "groq/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "groq/qwen-qwq-32b", + "name": "Qwen QwQ 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-11-27", + "last_updated": "2024-11-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.29, + "output": 0.39 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "groq/qwen/qwen3-32b", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11-08", + "release_date": "2024-12-23", + "last_updated": "2024-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.29, + "output": 0.59 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "helicone/chatgpt-4o", + "name": "OpenAI ChatGPT-4o", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 20.0, + "cache_read": 2.5 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "helicone/claude-3-haiku", + "name": "Anthropic: Claude 3 Haiku", + "family": "claude-haiku", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-03", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "helicone/claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "family": "claude-haiku", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.7999999999999999, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "helicone/claude-3.5-sonnet-v2", + "name": "Anthropic: Claude 3.5 Sonnet v2", + "family": "claude-sonnet", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "helicone/claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "family": "claude-sonnet", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "helicone/claude-4.5-haiku", + "name": "Anthropic: Claude 4.5 Haiku", + "family": "claude-haiku", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "helicone/claude-4.5-opus", + "name": "Anthropic: Claude Opus 4.5", + "family": "claude-opus", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "helicone/claude-4.5-sonnet", + "name": "Anthropic: Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "helicone/claude-haiku-4.5", + "name": "Anthropic: Claude 4.5 Haiku (20251001)", + "family": "claude-haiku", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "helicone/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "family": "claude-opus", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "helicone/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1 (20250805)", + "family": "claude-opus", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "helicone/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "helicone/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "family": "claude-sonnet", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "helicone/codex-mini", + "name": "OpenAI Codex Mini Latest", + "family": "gpt-codex-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 6.0, + "cache_read": 0.375 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "helicone/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.03, + "output": 0.13 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "helicone/deepseek-reasoner", + "name": "DeepSeek Reasoner", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "helicone/deepseek-tng-r1t2-chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-02", + "last_updated": "2025-07-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 130000, + "output": 163840 + } + }, + { + "id": "helicone/deepseek-v3", + "name": "DeepSeek V3", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "helicone/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 1.0, + "cache_read": 0.21600000000000003 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "helicone/deepseek-v3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.41 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "helicone/ernie-4.5-21b-a3b-thinking", + "name": "Baidu Ernie 4.5 21B A3B Thinking", + "family": "ernie", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 128000, + "output": 8000 + } + }, + { + "id": "helicone/gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.3 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "helicone/gemini-2.5-flash-lite", + "name": "Google Gemini 2.5 Flash Lite", + "family": "gemini-flash-lite", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998, + "cache_write": 0.09999999999999999 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "helicone/gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.3125, + "cache_write": 1.25 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "helicone/gemini-3-pro-preview", + "name": "Google Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.19999999999999998 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "helicone/gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049999999999999996, + "output": 0.09999999999999999 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "helicone/gemma2-9b-it", + "name": "Google Gemma 2", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-25", + "last_updated": "2024-06-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.01, + "output": 0.03 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "helicone/glm-4.6", + "name": "Zai GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.44999999999999996, + "output": 1.5 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "helicone/gpt-4.1", + "name": "OpenAI GPT-4.1", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "helicone/gpt-4.1-mini", + "name": "OpenAI GPT-4.1 Mini", + "family": "gpt-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "helicone/gpt-4.1-nano", + "name": "OpenAI GPT-4.1 Nano", + "family": "gpt-nano", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "helicone/gpt-4o", + "name": "OpenAI GPT-4o", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "helicone/gpt-4o-mini", + "name": "OpenAI GPT-4o-mini", + "family": "gpt-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "helicone/gpt-5", + "name": "OpenAI GPT-5", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.12500000000000003 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-5-chat", + "name": "OpenAI GPT-5 Chat Latest", + "family": "gpt-codex", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09", + "release_date": "2024-09-30", + "last_updated": "2024-09-30", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.12500000000000003 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "helicone/gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.12500000000000003 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-5-mini", + "name": "OpenAI GPT-5 Mini", + "family": "gpt-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.024999999999999998 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-5-nano", + "name": "OpenAI GPT-5 Nano", + "family": "gpt-nano", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049999999999999996, + "output": 0.39999999999999997, + "cache_read": 0.005 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "family": "gpt-pro", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 120.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "helicone/gpt-5.1", + "name": "OpenAI GPT-5.1", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.12500000000000003 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-5.1-chat", + "name": "OpenAI GPT-5.1 Chat", + "family": "gpt-codex", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.12500000000000003 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "helicone/gpt-5.1-codex", + "name": "OpenAI: GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.12500000000000003 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1 Codex Mini", + "family": "gpt-codex", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.024999999999999998 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "helicone/gpt-oss-120b", + "name": "OpenAI GPT-OSS 120b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.04, + "output": 0.16 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "helicone/gpt-oss-20b", + "name": "OpenAI GPT-OSS 20b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049999999999999996, + "output": 0.19999999999999998 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "helicone/grok-3", + "name": "xAI Grok 3", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "helicone/grok-3-mini", + "name": "xAI Grok 3 Mini", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "helicone/grok-4", + "name": "xAI Grok 4", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-09", + "last_updated": "2024-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "helicone/grok-4-fast", + "name": "xAI: Grok 4 Fast Reasoning", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "helicone/grok-4-fast-non", + "name": "xAI Grok 4 Fast Non-Reasoning", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "helicone/grok-4.1-fast", + "name": "xAI Grok 4.1 Fast Reasoning", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "helicone/grok-4.1-fast-non", + "name": "xAI Grok 4.1 Fast Non-Reasoning", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "helicone/grok-code-fast-1", + "name": "xAI Grok Code Fast 1", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-08-25", + "last_updated": "2024-08-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.19999999999999998, + "output": 1.5, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 10000 + } + }, + { + "id": "helicone/hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.14 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "helicone/kimi-k2", + "name": "Kimi K2 (09/05)", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.0, + "cache_read": 0.39999999999999997 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "helicone/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.48, + "output": 2.0 + }, + "limit": { + "context": 256000, + "output": 262144 + } + }, + { + "id": "helicone/llama-3.1-8b-instant", + "name": "Meta Llama 3.1 8B Instant", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.049999999999999996, + "output": 0.08 + }, + "limit": { + "context": 131072, + "output": 32678 + } + }, + { + "id": "helicone/llama-3.1-8b-instruct", + "name": "Meta Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.049999999999999996 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "helicone/llama-3.1-8b-instruct-turbo", + "name": "Meta Llama 3.1 8B Instruct Turbo", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.03 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "helicone/llama-3.3-70b-instruct", + "name": "Meta Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.39 + }, + "limit": { + "context": 128000, + "output": 16400 + } + }, + { + "id": "helicone/llama-3.3-70b-versatile", + "name": "Meta Llama 3.3 70B Versatile", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.7899999999999999 + }, + "limit": { + "context": 131072, + "output": 32678 + } + }, + { + "id": "helicone/llama-4-maverick", + "name": "Meta Llama 4 Maverick 17B 128E", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "helicone/llama-4-scout", + "name": "Meta Llama 4 Scout 17B 16E", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.08, + "output": 0.3 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "helicone/llama-guard-4", + "name": "Meta Llama Guard 4 12B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 0.21 + }, + "limit": { + "context": 131072, + "output": 1024 + } + }, + { + "id": "helicone/llama-prompt-guard-2-22m", + "name": "Meta Llama Prompt Guard 2 22M", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.01, + "output": 0.01 + }, + "limit": { + "context": 512, + "output": 2 + } + }, + { + "id": "helicone/llama-prompt-guard-2-86m", + "name": "Meta Llama Prompt Guard 2 86M", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.01, + "output": 0.01 + }, + "limit": { + "context": 512, + "output": 2 + } + }, + { + "id": "helicone/mistral-large", + "name": "Mistral-Large", + "family": "mistral-large", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "helicone/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 20.0, + "output": 40.0 + }, + "limit": { + "context": 128000, + "output": 16400 + } + }, + { + "id": "helicone/mistral-small", + "name": "Mistral Small", + "family": "mistral-small", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-02", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 75.0, + "output": 200.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "helicone/o1", + "name": "OpenAI: o1", + "family": "o", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "helicone/o1-mini", + "name": "OpenAI: o1-mini", + "family": "o-mini", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "helicone/o3", + "name": "OpenAI o3", + "family": "o", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "helicone/o3-mini", + "name": "OpenAI o3 Mini", + "family": "o-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2023-10", + "release_date": "2023-10-01", + "last_updated": "2023-10-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "helicone/o3-pro", + "name": "OpenAI o3 Pro", + "family": "o-pro", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 20.0, + "output": 80.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "helicone/o4-mini", + "name": "OpenAI o4 Mini", + "family": "o-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "helicone/qwen2.5-coder-7b-fast", + "name": "Qwen2.5 Coder 7B fast", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-09-15", + "last_updated": "2024-09-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.03, + "output": 0.09 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "helicone/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.9000000000000004 + }, + "limit": { + "context": 262144, + "output": 81920 + } + }, + { + "id": "helicone/qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.08, + "output": 0.29 + }, + "limit": { + "context": 41000, + "output": 41000 + } + }, + { + "id": "helicone/qwen3-32b", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 0.59 + }, + "limit": { + "context": 131072, + "output": 40960 + } + }, + { + "id": "helicone/qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.22, + "output": 0.95 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "helicone/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09999999999999999, + "output": 0.3 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "helicone/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 1.4 + }, + "limit": { + "context": 262000, + "output": 16384 + } + }, + { + "id": "helicone/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.5 + }, + "limit": { + "context": 256000, + "output": 16384 + } + }, + { + "id": "helicone/sonar", + "name": "Perplexity Sonar", + "family": "sonar", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 1.0 + }, + "limit": { + "context": 127000, + "output": 4096 + } + }, + { + "id": "helicone/sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "family": "sonar-deep-research", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0 + }, + "limit": { + "context": 127000, + "output": 4096 + } + }, + { + "id": "helicone/sonar-pro", + "name": "Perplexity Sonar Pro", + "family": "sonar-pro", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "helicone/sonar-reasoning-pro", + "name": "Perplexity Sonar Reasoning Pro", + "family": "sonar-reasoning", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0 + }, + "limit": { + "context": 127000, + "output": 4096 + } + }, + { + "id": "huggingface/MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "huggingface/MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "huggingface/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen3-235B-A22B-Thinking-2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "huggingface/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "huggingface/Qwen/Qwen3-Coder-Next", + "name": "Qwen3-Coder-Next", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.5 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "huggingface/Qwen/Qwen3-Embedding-4B", + "name": "Qwen 3 Embedding 4B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32000, + "output": 2048 + } + }, + { + "id": "huggingface/Qwen/Qwen3-Embedding-8B", + "name": "Qwen 3 Embedding 8B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "huggingface/Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "huggingface/Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "huggingface/Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "huggingface/XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo-V2-Flash", + "family": "mimo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 262144, + "output": 4096 + } + }, + { + "id": "huggingface/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek-R1-0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 3.0, + "output": 5.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "huggingface/deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 0.4 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "huggingface/moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct-0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "huggingface/moonshotai/Kimi-K2-Thinking", + "name": "Kimi-K2-Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "huggingface/moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.1 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "huggingface/zai-org/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "huggingface/zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "huggingface/zai-org/GLM-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "iflowcn/deepseek-r1", + "name": "DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "iflowcn/deepseek-v3", + "name": "DeepSeek-V3", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "iflowcn/deepseek-v3.2", + "name": "DeepSeek-V3.2-Exp", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "iflowcn/glm-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "iflowcn/kimi-k2", + "name": "Kimi-K2-0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "iflowcn/qwen3-235b", + "name": "Qwen3-235B-A22B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "iflowcn/qwen3-235b-a22b-instruct", + "name": "Qwen3-235B-A22B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "iflowcn/qwen3-235b-a22b-thinking", + "name": "Qwen3-235B-A22B-Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "iflowcn/qwen3-32b", + "name": "Qwen3-32B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "iflowcn/qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "iflowcn/qwen3-max", + "name": "Qwen3-Max", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "iflowcn/qwen3-max-preview", + "name": "Qwen3-Max-Preview", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "iflowcn/qwen3-vl-plus", + "name": "Qwen3-VL-Plus", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "inception/mercury", + "name": "Mercury", + "family": "mercury", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2025-06-26", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0, + "cache_read": 0.25, + "cache_write": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "inception/mercury-coder", + "name": "Mercury Coder", + "family": "mercury", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2025-02-26", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0, + "cache_read": 0.25, + "cache_write": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "inference/google/gemma-3", + "name": "Google Gemma 3", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.3 + }, + "limit": { + "context": 125000, + "output": 4096 + } + }, + { + "id": "inference/meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.025, + "output": 0.025 + }, + "limit": { + "context": 16000, + "output": 4096 + } + }, + { + "id": "inference/meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.055, + "output": 0.055 + }, + "limit": { + "context": 16000, + "output": 4096 + } + }, + { + "id": "inference/meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.01 + }, + "limit": { + "context": 16000, + "output": 4096 + } + }, + { + "id": "inference/meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.02 + }, + "limit": { + "context": 16000, + "output": 4096 + } + }, + { + "id": "inference/mistral/mistral-nemo-12b-instruct", + "name": "Mistral Nemo 12B Instruct", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.038, + "output": 0.1 + }, + "limit": { + "context": 16000, + "output": 4096 + } + }, + { + "id": "inference/osmosis/osmosis-structure-0.6b", + "name": "Osmosis Structure 0.6B", + "family": "osmosis", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.5 + }, + "limit": { + "context": 4000, + "output": 2048 + } + }, + { + "id": "inference/qwen/qwen-2.5-7b-vision-instruct", + "name": "Qwen 2.5 7B Vision Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 125000, + "output": 4096 + } + }, + { + "id": "inference/qwen/qwen3-embedding-4b", + "name": "Qwen 3 Embedding 4B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32000, + "output": 2048 + } + }, + { + "id": "io-net/Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", + "name": "Qwen 3 Coder 480B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.95, + "cache_read": 0.11, + "cache_write": 0.44 + }, + "limit": { + "context": 106000, + "output": 4096 + } + }, + { + "id": "io-net/Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen 2.5 VL 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "io-net/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen 3 235B Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 + }, + "limit": { + "context": 262144, + "output": 4096 + } + }, + { + "id": "io-net/Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen 3 Next 80B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-10", + "last_updated": "2025-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.8, + "cache_read": 0.05, + "cache_write": 0.2 + }, + "limit": { + "context": 262144, + "output": 4096 + } + }, + { + "id": "io-net/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 8.75, + "cache_read": 1.0, + "cache_write": 4.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "io-net/meta-llama/Llama-3.2-90B-Vision-Instruct", + "name": "Llama 3.2 90B Vision Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 0.4, + "cache_read": 0.175, + "cache_write": 0.7 + }, + "limit": { + "context": 16000, + "output": 4096 + } + }, + { + "id": "io-net/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.38, + "cache_read": 0.065, + "cache_write": 0.26 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "io-net/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075, + "cache_write": 0.3 + }, + "limit": { + "context": 430000, + "output": 4096 + } + }, + { + "id": "io-net/mistralai/Devstral-Small", + "name": "Devstral Small 2505", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "io-net/mistralai/Magistral-Small", + "name": "Magistral Small 2506", + "family": "magistral-small", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 0.25, + "cache_write": 1.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "io-net/mistralai/Mistral-Large-Instruct", + "name": "Mistral Large Instruct 2411", + "family": "mistral-large", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 6.0, + "cache_read": 1.0, + "cache_write": 4.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "io-net/mistralai/Mistral-Nemo-Instruct", + "name": "Mistral Nemo Instruct 2407", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.04, + "cache_read": 0.01, + "cache_write": 0.04 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "io-net/moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-09-05", + "last_updated": "2024-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.39, + "output": 1.9, + "cache_read": 0.195, + "cache_write": 0.78 + }, + "limit": { + "context": 32768, + "output": 4096 + } + }, + { + "id": "io-net/moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.55, + "output": 2.25, + "cache_read": 0.275, + "cache_write": 1.1 + }, + "limit": { + "context": 32768, + "output": 4096 + } + }, + { + "id": "io-net/openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.4, + "cache_read": 0.02, + "cache_write": 0.08 + }, + "limit": { + "context": 131072, + "output": 4096 + } + }, + { + "id": "io-net/openai/gpt-oss-20b", + "name": "GPT-OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.14, + "cache_read": 0.015, + "cache_write": 0.06 + }, + "limit": { + "context": 64000, + "output": 4096 + } + }, + { + "id": "io-net/zai-org/GLM-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2024-11-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.75, + "cache_read": 0.2, + "cache_write": 0.8 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "jiekou/baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "family": "ernie", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.1 + }, + "limit": { + "context": 123000, + "output": 12000 + } + }, + { + "id": "jiekou/baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "family": "ernie", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.42, + "output": 1.25 + }, + "limit": { + "context": 123000, + "output": 16000 + } + }, + { + "id": "jiekou/claude-haiku-4.5", + "name": "claude-haiku-4-5-20251001", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.9, + "output": 4.5 + }, + "limit": { + "context": 20000, + "output": 64000 + } + }, + { + "id": "jiekou/claude-opus-4", + "name": "claude-opus-4-20250514", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 13.5, + "output": 67.5 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "jiekou/claude-opus-4.1", + "name": "claude-opus-4-1-20250805", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 13.5, + "output": 67.5 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "jiekou/claude-opus-4.5", + "name": "claude-opus-4-5-20251101", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 4.5, + "output": 22.5 + }, + "limit": { + "context": 200000, + "output": 65536 + } + }, + { + "id": "jiekou/claude-opus-4.6", + "name": "claude-opus-4-6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02", + "last_updated": "2026-02", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "jiekou/claude-sonnet-4", + "name": "claude-sonnet-4-20250514", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.7, + "output": 13.5 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "jiekou/claude-sonnet-4.5", + "name": "claude-sonnet-4-5-20250929", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.7, + "output": 13.5 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "jiekou/deepseek/deepseek-r1", + "name": "DeepSeek R1 0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.5 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "jiekou/deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.14 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "jiekou/deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "jiekou/gemini-2.5-flash", + "name": "gemini-2.5-flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 2.25 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "jiekou/gemini-2.5-flash-lite", + "name": "gemini-2.5-flash-lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.36 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "jiekou/gemini-2.5-flash-lite-preview-06-17", + "name": "gemini-2.5-flash-lite-preview-06-17", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "video", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.36 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "jiekou/gemini-2.5-flash-lite-preview-09", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.36 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "jiekou/gemini-2.5-flash-preview-05-20", + "name": "gemini-2.5-flash-preview-05-20", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.135, + "output": 3.15 + }, + "limit": { + "context": 1048576, + "output": 200000 + } + }, + { + "id": "jiekou/gemini-2.5-pro", + "name": "gemini-2.5-pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "jiekou/gemini-2.5-pro-preview-06-05", + "name": "gemini-2.5-pro-preview-06-05", + "family": "gemini-pro", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 1048576, + "output": 200000 + } + }, + { + "id": "jiekou/gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "jiekou/gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.8, + "output": 10.8 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "jiekou/gpt-5-chat", + "name": "gpt-5-chat-latest", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5-codex", + "name": "gpt-5-codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5-mini", + "name": "gpt-5-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.225, + "output": 1.8 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5-nano", + "name": "gpt-5-nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.045, + "output": 0.36 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5-pro", + "name": "gpt-5-pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 13.5, + "output": 108.0 + }, + "limit": { + "context": 400000, + "output": 272000 + } + }, + { + "id": "jiekou/gpt-5.1", + "name": "gpt-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02", + "last_updated": "2026-02", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5.1-codex", + "name": "gpt-5.1-codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5.1-codex-max", + "name": "gpt-5.1-codex-max", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.125, + "output": 9.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5.1-codex-mini", + "name": "gpt-5.1-codex-mini", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.225, + "output": 1.8 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5.2", + "name": "gpt-5.2", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.575, + "output": 12.6 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5.2-codex", + "name": "gpt-5.2-codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/gpt-5.2-pro", + "name": "gpt-5.2-pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 18.9, + "output": 151.2 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "jiekou/grok-4", + "name": "grok-4-0709", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.7, + "output": 13.5 + }, + "limit": { + "context": 256000, + "output": 8192 + } + }, + { + "id": "jiekou/grok-4-fast", + "name": "grok-4-fast-reasoning", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.45 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "jiekou/grok-4-fast-non", + "name": "grok-4-fast-non-reasoning", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.45 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "jiekou/grok-4.1-fast", + "name": "grok-4-1-fast-reasoning", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.45 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "jiekou/grok-4.1-fast-non", + "name": "grok-4-1-fast-non-reasoning", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.45 + }, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "jiekou/grok-code-fast-1", + "name": "grok-code-fast-1", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 1.35 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "jiekou/minimax/minimax-m2.1", + "name": "Minimax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "jiekou/minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.2 + }, + "limit": { + "context": 1000000, + "output": 40000 + } + }, + { + "id": "jiekou/moonshotai/kimi-k2", + "name": "Kimi K2 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "jiekou/moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.57, + "output": 2.3 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "jiekou/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "jiekou/o3", + "name": "o3", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 40.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "jiekou/o3-mini", + "name": "o3-mini", + "family": "o", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "jiekou/o4-mini", + "name": "o4-mini", + "family": "o", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "jiekou/qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 40960, + "output": 20000 + } + }, + { + "id": "jiekou/qwen/qwen3-235b-a22b-instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.8 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "jiekou/qwen/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22b Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 3.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "jiekou/qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.45 + }, + "limit": { + "context": 40960, + "output": 20000 + } + }, + { + "id": "jiekou/qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.45 + }, + "limit": { + "context": 40960, + "output": 20000 + } + }, + { + "id": "jiekou/qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.29, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "jiekou/qwen/qwen3-coder-next", + "name": "qwen/qwen3-coder-next", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02", + "last_updated": "2026-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.5 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "jiekou/qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "jiekou/qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "jiekou/xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "family": "mimo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "jiekou/zai-org/glm-4.5", + "name": "GLM-4.5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "jiekou/zai-org/glm-4.5v", + "name": "GLM 4.5V", + "family": "glmv", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.8 + }, + "limit": { + "context": 65536, + "output": 16384 + } + }, + { + "id": "jiekou/zai-org/glm-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "jiekou/zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.4 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "kilo/allenai/molmo-2-8b", + "name": "AllenAI: Molmo2 8B", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-09", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 36864, + "output": 36864 + } + }, + { + "id": "kilo/amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5 + }, + "limit": { + "context": 1000000, + "output": 65535 + } + }, + { + "id": "kilo/amazon/nova-pro-v1", + "name": "Amazon: Nova Pro 1.0", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 3.2 + }, + "limit": { + "context": 300000, + "output": 5120 + } + }, + { + "id": "kilo/anthropic/claude-3-haiku", + "name": "Anthropic: Claude 3 Haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-03-07", + "last_updated": "2024-03-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "kilo/anthropic/claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "kilo/anthropic/claude-3.5-sonnet", + "name": "Anthropic: Claude 3.5 Sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 6.0, + "output": 30.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "kilo/anthropic/claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "kilo/anthropic/claude-3.7-sonnet:thinking", + "name": "Anthropic: Claude 3.7 Sonnet (thinking)", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-19", + "last_updated": "2025-02-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "kilo/anthropic/claude-haiku-4.5", + "name": "Anthropic: Claude Haiku 4.5", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "kilo/anthropic/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "kilo/anthropic/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "kilo/anthropic/claude-opus-4.5", + "name": "Anthropic: Claude Opus 4.5", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "kilo/anthropic/claude-opus-4.6", + "name": "Anthropic: Claude Opus 4.6", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "kilo/anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "kilo/anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "kilo/arcee-ai/trinity-large-preview:free", + "name": "Arcee AI: Trinity Large Preview (free)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131000, + "output": 26200 + } + }, + { + "id": "kilo/arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.045, + "output": 0.15 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/arcee-ai/trinity-mini:free", + "name": "Arcee AI: Trinity Mini (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/baidu/ernie-4.5-21b-a3b", + "name": "Baidu: ERNIE 4.5 21B A3B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 120000, + "output": 8000 + } + }, + { + "id": "kilo/baidu/ernie-4.5-21b-a3b-thinking", + "name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "kilo/baidu/ernie-4.5-300b-a47b", + "name": "Baidu: ERNIE 4.5 300B A47B ", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.1 + }, + "limit": { + "context": 123000, + "output": 12000 + } + }, + { + "id": "kilo/baidu/ernie-4.5-vl-28b-a3b", + "name": "Baidu: ERNIE 4.5 VL 28B A3B", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 0.56 + }, + "limit": { + "context": 30000, + "output": 8000 + } + }, + { + "id": "kilo/baidu/ernie-4.5-vl-424b-a47b", + "name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.42, + "output": 1.25 + }, + "limit": { + "context": 123000, + "output": 16000 + } + }, + { + "id": "kilo/bytedance-seed/seed-1.6", + "name": "ByteDance Seed: Seed 1.6", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09", + "last_updated": "2025-09", + "modalities": { + "input": [ + "image", + "text", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "kilo/cognitivecomputations/dolphin-mistral-24b-venice-edition:free", + "name": "Venice: Uncensored (free)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-07-09", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/cohere/command-a", + "name": "Cohere: Command A", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 256000, + "output": 8192 + } + }, + { + "id": "kilo/cohere/command-r-08", + "name": "Cohere: Command R (08-2024)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "kilo/cohere/command-r-plus-08", + "name": "Cohere: Command R+ (08-2024)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "kilo/cohere/command-r7b-12", + "name": "Cohere: Command R7B (12-2024)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-02-27", + "last_updated": "2024-02-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0375, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 4000 + } + }, + { + "id": "kilo/deepseek/deepseek-chat", + "name": "DeepSeek: DeepSeek V3", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "kilo/deepseek/deepseek-chat-v3", + "name": "DeepSeek: DeepSeek V3 0324", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.19, + "output": 0.87, + "cache_read": 0.095 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "kilo/deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.75 + }, + "limit": { + "context": 32768, + "output": 7168 + } + }, + { + "id": "kilo/deepseek/deepseek-r1", + "name": "DeepSeek: R1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.5 + }, + "limit": { + "context": 64000, + "output": 16000 + } + }, + { + "id": "kilo/deepseek/deepseek-r1-0528:free", + "name": "DeepSeek: R1 0528 (free)", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "kilo/deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek: R1 Distill Llama 70B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-23", + "last_updated": "2025-01-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11, + "cache_read": 0.015 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek: R1 Distill Qwen 32B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.29, + "output": 0.29 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "kilo/deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek: DeepSeek V3.1 Terminus", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.21, + "output": 0.79, + "cache_read": 0.13 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "kilo/deepseek/deepseek-v3.1-terminus:exacto", + "name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.21, + "output": 0.79, + "cache_read": 0.168 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "kilo/deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.38, + "cache_read": 0.125 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "kilo/deepseek/deepseek-v3.2-exp", + "name": "DeepSeek: DeepSeek V3.2 Exp", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-01", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.41 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "kilo/deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.41, + "cache_read": 0.135 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "kilo/essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-05", + "last_updated": "2025-12-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/google/gemini-2.0-flash-001", + "name": "Google: Gemini 2.0 Flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "cache_write": 0.083333 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "kilo/google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-11", + "last_updated": "2025-06-16", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "kilo/google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-17", + "last_updated": "2025-07-17", + "modalities": { + "input": [ + "image", + "text", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "cache_write": 0.083333 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "kilo/google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "kilo/google/gemini-2.5-flash-lite-preview-09", + "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "kilo/google/gemini-2.5-flash-preview-09", + "name": "Google: Gemini 2.5 Flash Preview 09-2025", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "image", + "text", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "cache_write": 0.083333 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "kilo/google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125, + "cache_write": 0.375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "kilo/google/gemini-2.5-pro-preview", + "name": "Google: Gemini 2.5 Pro Preview 06-05", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-05", + "last_updated": "2026-01", + "modalities": { + "input": [ + "image", + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125, + "cache_write": 0.375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "kilo/google/gemini-2.5-pro-preview-05-06", + "name": "Google: Gemini 2.5 Pro Preview 05-06", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125, + "cache_write": 0.375 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "kilo/google/gemini-3-flash-preview", + "name": "Google: Gemini 3 Flash Preview", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05, + "cache_write": 0.083333 + }, + "limit": { + "context": 1048576, + "output": 65535 + } + }, + { + "id": "kilo/google/gemini-3-pro-preview", + "name": "Google: Gemini 3 Pro Preview", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-18", + "last_updated": "2025-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2, + "cache_write": 0.375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "kilo/google/gemma-2-27b-it", + "name": "Google: Gemma 2 27B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-06-24", + "last_updated": "2024-06-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.65, + "output": 0.65 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "kilo/google/gemma-2-9b-it", + "name": "Google: Gemma 2 9B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-06-28", + "last_updated": "2024-06-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.09 + }, + "limit": { + "context": 8192, + "output": 1639 + } + }, + { + "id": "kilo/google/gemma-3-12b-it", + "name": "Google: Gemma 3 12B", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.1, + "cache_read": 0.015 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/google/gemma-3-12b-it:free", + "name": "Google: Gemma 3 12B (free)", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "kilo/google/gemma-3-27b-it", + "name": "Google: Gemma 3 27B", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.15, + "cache_read": 0.02 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "kilo/google/gemma-3-27b-it:free", + "name": "Google: Gemma 3 27B (free)", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "kilo/google/gemma-3-4b-it", + "name": "Google: Gemma 3 4B", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01703, + "output": 0.068154 + }, + "limit": { + "context": 96000, + "output": 19200 + } + }, + { + "id": "kilo/google/gemma-3-4b-it:free", + "name": "Google: Gemma 3 4B (free)", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "kilo/google/gemma-3n-e2b-it:free", + "name": "Google: Gemma 3n 2B (free)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "kilo/google/gemma-3n-e4b-it", + "name": "Google: Gemma 3n 4B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.04 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/google/gemma-3n-e4b-it:free", + "name": "Google: Gemma 3n 4B (free)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2048 + } + }, + { + "id": "kilo/gryphe/mythomax-l2-13b", + "name": "MythoMax 13B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.06 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "kilo/inception/mercury", + "name": "Inception: Mercury", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-26", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/inception/mercury-coder", + "name": "Inception: Mercury Coder", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-26", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/kilo/auto", + "name": "Kilo: Auto", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 1.0 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "kilo/kwaipilot/kat-coder-pro", + "name": "Kwaipilot: KAT-Coder-Pro V1", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2025-10-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.207, + "output": 0.828, + "cache_read": 0.0414 + }, + "limit": { + "context": 256000, + "output": 128000 + } + }, + { + "id": "kilo/liquid/lfm-2.5-1.2b-instruct:free", + "name": "LiquidAI: LFM2.5-1.2B-Instruct (free)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-20", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/liquid/lfm-2.5-1.2b-thinking:free", + "name": "LiquidAI: LFM2.5-1.2B-Thinking (free)", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-20", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/meituan/longcat-flash-chat", + "name": "Meituan: LongCat Flash Chat", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-30", + "last_updated": "2025-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.8, + "cache_read": 0.2 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/meta-llama/llama-3-70b-instruct", + "name": "Meta: Llama 3 70B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.51, + "output": 0.74 + }, + "limit": { + "context": 8192, + "output": 8000 + } + }, + { + "id": "kilo/meta-llama/llama-3-8b-instruct", + "name": "Meta: Llama 3 8B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-25", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.04 + }, + "limit": { + "context": 8192, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-3.1-405b-instruct", + "name": "Meta: Llama 3.1 405B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-16", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 4.0, + "output": 4.0 + }, + "limit": { + "context": 131000, + "output": 26200 + } + }, + { + "id": "kilo/meta-llama/llama-3.1-70b-instruct", + "name": "Meta: Llama 3.1 70B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 0.4 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/meta-llama/llama-3.1-8b-instruct", + "name": "Meta: Llama 3.1 8B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.05 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-3.2-11b-vision-instruct", + "name": "Meta: Llama 3.2 11B Vision Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.049, + "output": 0.049 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-3.2-1b-instruct", + "name": "Meta: Llama 3.2 1B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.027, + "output": 0.2 + }, + "limit": { + "context": 60000, + "output": 12000 + } + }, + { + "id": "kilo/meta-llama/llama-3.2-3b-instruct", + "name": "Meta: Llama 3.2 3B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.02 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-3.2-3b-instruct:free", + "name": "Meta: Llama 3.2 3B Instruct (free)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/meta-llama/llama-3.3-70b-instruct", + "name": "Meta: Llama 3.3 70B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.32 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-3.3-70b-instruct:free", + "name": "Meta: Llama 3.3 70B Instruct (free)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "kilo/meta-llama/llama-4-maverick", + "name": "Meta: Llama 4 Maverick", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-05", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 1048576, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-4-scout", + "name": "Meta: Llama 4 Scout", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.3 + }, + "limit": { + "context": 327680, + "output": 16384 + } + }, + { + "id": "kilo/meta-llama/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-18", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.06 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/meta-llama/llama-guard-4-12b", + "name": "Meta: Llama Guard 4 12B", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "kilo/microsoft/phi-4", + "name": "Microsoft: Phi 4", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.14 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "kilo/microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.62, + "output": 0.62 + }, + "limit": { + "context": 65535, + "output": 8000 + } + }, + { + "id": "kilo/minimax/minimax-01", + "name": "MiniMax: MiniMax-01", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.1 + }, + "limit": { + "context": 1000192, + "output": 1000192 + } + }, + { + "id": "kilo/minimax/minimax-m1", + "name": "MiniMax: MiniMax M1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.2 + }, + "limit": { + "context": 1000000, + "output": 40000 + } + }, + { + "id": "kilo/minimax/minimax-m2", + "name": "MiniMax: MiniMax M2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-23", + "last_updated": "2025-10-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.255, + "output": 1.0, + "cache_read": 0.03 + }, + "limit": { + "context": 196608, + "output": 65536 + } + }, + { + "id": "kilo/minimax/minimax-m2.1", + "name": "MiniMax: MiniMax M2.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.95, + "cache_read": 0.03 + }, + "limit": { + "context": 196608, + "output": 39322 + } + }, + { + "id": "kilo/minimax/minimax-m2.5", + "name": "MiniMax: MiniMax M2.5", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.029 + }, + "limit": { + "context": 196608, + "output": 39322 + } + }, + { + "id": "kilo/minimax/minimax-m2.5:free", + "name": "MiniMax: MiniMax M2.5 (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "kilo/mistralai/codestral", + "name": "Mistral: Codestral 2508", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 256000, + "output": 51200 + } + }, + { + "id": "kilo/mistralai/devstral", + "name": "Mistral: Devstral 2 2512", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "kilo/mistralai/devstral-medium", + "name": "Mistral: Devstral Medium", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/mistralai/devstral-small", + "name": "Mistral: Devstral Small 1.1", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-07", + "last_updated": "2025-07-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/mistralai/ministral-14b", + "name": "Mistral: Ministral 3 14B 2512", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/mistralai/mistral-7b-instruct", + "name": "Mistral: Mistral 7B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-05-27", + "last_updated": "2024-05-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 32768, + "output": 4096 + } + }, + { + "id": "kilo/mistralai/mistral-7b-instruct-v0.1", + "name": "Mistral: Mistral 7B Instruct v0.1", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.11, + "output": 0.19 + }, + "limit": { + "context": 2824, + "output": 565 + } + }, + { + "id": "kilo/mistralai/mistral-7b-instruct-v0.3", + "name": "Mistral: Mistral 7B Instruct v0.3", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 32768, + "output": 4096 + } + }, + { + "id": "kilo/mistralai/mistral-large", + "name": "Mistral Large 2411", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-24", + "last_updated": "2024-11-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/mistralai/mistral-medium-3", + "name": "Mistral: Mistral Medium 3", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/mistralai/mistral-medium-3.1", + "name": "Mistral: Mistral Medium 3.1", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/mistralai/mistral-nemo", + "name": "Mistral: Mistral Nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-01", + "last_updated": "2024-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.04 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "kilo/mistralai/mistral-small-24b-instruct", + "name": "Mistral: Mistral Small 3", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.08 + }, + "limit": { + "context": 32768, + "output": 16384 + } + }, + { + "id": "kilo/mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral: Mistral Small 3.1 24B", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-17", + "last_updated": "2025-03-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11, + "cache_read": 0.015 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/mistralai/mistral-small-3.1-24b-instruct:free", + "name": "Mistral: Mistral Small 3.1 24B (free)", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-17", + "last_updated": "2025-03-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 25600 + } + }, + { + "id": "kilo/mistralai/mistral-small-3.2-24b-instruct", + "name": "Mistral: Mistral Small 3.2 24B", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.18, + "cache_read": 0.03 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 65536, + "output": 13108 + } + }, + { + "id": "kilo/mistralai/voxtral-small-24b", + "name": "Mistral: Voxtral Small 24B 2507", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 32000, + "output": 6400 + } + }, + { + "id": "kilo/moonshotai/kimi-k2", + "name": "MoonshotAI: Kimi K2 0905", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0, + "cache_read": 0.15 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/moonshotai/kimi-k2-0905:exacto", + "name": "MoonshotAI: Kimi K2 0905 (exacto)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/moonshotai/kimi-k2-thinking", + "name": "MoonshotAI: Kimi K2 Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.75, + "cache_read": 0.2 + }, + "limit": { + "context": 262144, + "output": 65535 + } + }, + { + "id": "kilo/moonshotai/kimi-k2.5", + "name": "MoonshotAI: Kimi K2.5", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.23, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "kilo/morph/morph-v3-fast", + "name": "Morph: Morph V3 Fast", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 1.2 + }, + "limit": { + "context": 81920, + "output": 38000 + } + }, + { + "id": "kilo/morph/morph-v3-large", + "name": "Morph: Morph V3 Large", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.9, + "output": 1.9 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "kilo/nex-agi/deepseek-v3.1-nex-n1", + "name": "Nex AGI: DeepSeek V3.1 Nex N1", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 163840 + } + }, + { + "id": "kilo/nousresearch/deephermes-3-mistral-24b-preview", + "name": "Nous: DeepHermes 3 Mistral 24B Preview", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.1, + "cache_read": 0.01 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "kilo/nousresearch/hermes-2-pro-llama-3-8b", + "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-05-27", + "last_updated": "2024-06-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 0.14 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "kilo/nousresearch/hermes-3-llama-3.1-405b", + "name": "Nous: Hermes 3 405B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-08-16", + "last_updated": "2024-08-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "kilo/nousresearch/hermes-3-llama-3.1-405b:free", + "name": "Nous: Hermes 3 405B Instruct (free)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-08-16", + "last_updated": "2024-08-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/nousresearch/hermes-4-405b", + "name": "Nous: Hermes 4 405B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/nousresearch/hermes-4-70b", + "name": "Nous: Hermes 4 70B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.38, + "cache_read": 0.055 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/nvidia/llama-3.1-nemotron-70b-instruct", + "name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-10-12", + "last_updated": "2024-10-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 1.2 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "kilo/nvidia/llama-3.1-nemotron-ultra-253b-v1", + "name": "NVIDIA: Llama 3.1 Nemotron Ultra 253B v1", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2024-07-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.8 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-16", + "last_updated": "2025-03-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/nvidia/nemotron-3-nano-30b-a3b", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-12", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.2 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/nvidia/nemotron-3-nano-30b-a3b:free", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-14", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 51200 + } + }, + { + "id": "kilo/nvidia/nemotron-nano-12b-v2-vl", + "name": "NVIDIA: Nemotron Nano 12B 2 VL", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-28", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/nvidia/nemotron-nano-12b-v2-vl:free", + "name": "NVIDIA: Nemotron Nano 12B 2 VL (free)", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-28", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "kilo/nvidia/nemotron-nano-9b-v2", + "name": "NVIDIA: Nemotron Nano 9B V2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-18", + "last_updated": "2025-08-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.16 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/nvidia/nemotron-nano-9b-v2:free", + "name": "NVIDIA: Nemotron Nano 9B V2 (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-05", + "last_updated": "2025-08-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 25600 + } + }, + { + "id": "kilo/openai/chatgpt-4o", + "name": "OpenAI: ChatGPT-4o", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-08-08", + "last_updated": "2024-08-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 15.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-3.5-turbo", + "name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2023-06-13", + "last_updated": "2023-06-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 4095, + "output": 4096 + } + }, + { + "id": "kilo/openai/gpt-3.5-turbo-instruct", + "name": "OpenAI: GPT-3.5 Turbo Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2023-03-01", + "last_updated": "2023-09-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 2.0 + }, + "limit": { + "context": 4095, + "output": 4096 + } + }, + { + "id": "kilo/openai/gpt-4", + "name": "OpenAI: GPT-4", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2023-03-14", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 30.0, + "output": 60.0 + }, + "limit": { + "context": 8191, + "output": 4096 + } + }, + { + "id": "kilo/openai/gpt-4-turbo", + "name": "OpenAI: GPT-4 Turbo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2023-09-13", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "kilo/openai/gpt-4.1", + "name": "OpenAI: GPT-4.1", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "kilo/openai/gpt-4.1-mini", + "name": "OpenAI: GPT-4.1 Mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "kilo/openai/gpt-4.1-nano", + "name": "OpenAI: GPT-4.1 Nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-14", + "last_updated": "2025-04-15", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "kilo/openai/gpt-4o", + "name": "OpenAI: GPT-4o (2024-11-20)", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-20", + "last_updated": "2024-11-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-4o-mini", + "name": "OpenAI: GPT-4o-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-4o-mini-search-preview", + "name": "OpenAI: GPT-4o-mini Search Preview", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-01", + "last_updated": "2025-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-4o:extended", + "name": "OpenAI: GPT-4o (extended)", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 6.0, + "output": 18.0 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "kilo/openai/gpt-5", + "name": "OpenAI: GPT-5", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5-chat", + "name": "OpenAI: GPT-5 Chat", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5-mini", + "name": "OpenAI: GPT-5 Mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5-nano", + "name": "OpenAI: GPT-5 Nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 120.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5.1", + "name": "OpenAI: GPT-5.1", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5.1-chat", + "name": "OpenAI: GPT-5.1 Chat", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-5.1-codex", + "name": "OpenAI: GPT-5.1-Codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1-Codex-Mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 100000 + } + }, + { + "id": "kilo/openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "kilo/openai/gpt-5.2-codex", + "name": "OpenAI: GPT-5.2-Codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 21.0, + "output": 168.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "kilo/openai/gpt-oss-120b", + "name": "OpenAI: gpt-oss-120b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.039, + "output": 0.19 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/openai/gpt-oss-120b:exacto", + "name": "OpenAI: gpt-oss-120b (exacto)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.039, + "output": 0.19 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/openai/gpt-oss-120b:free", + "name": "OpenAI: gpt-oss-120b (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/openai/gpt-oss-20b", + "name": "OpenAI: gpt-oss-20b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.14 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/openai/gpt-oss-20b:free", + "name": "OpenAI: gpt-oss-20b (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/openai/gpt-oss-safeguard-20b", + "name": "OpenAI: gpt-oss-safeguard-20b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "kilo/openai/o1", + "name": "OpenAI: o1", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-12-05", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o1-pro", + "name": "OpenAI: o1-pro", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": false, + "release_date": "2025-03-19", + "last_updated": "2025-03-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 150.0, + "output": 600.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o3", + "name": "OpenAI: o3", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-16", + "last_updated": "2026-01", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o3-deep-research", + "name": "OpenAI: o3 Deep Research", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-06-26", + "last_updated": "2025-06-27", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 40.0, + "cache_read": 2.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o3-mini", + "name": "OpenAI: o3 Mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-12-20", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o3-mini-high", + "name": "OpenAI: o3 Mini High", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o3-pro", + "name": "OpenAI: o3 Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-16", + "last_updated": "2025-06-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 20.0, + "output": 80.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o4-mini", + "name": "OpenAI: o4 Mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openai/o4-mini-deep-research", + "name": "OpenAI: o4 Mini Deep Research", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-06-26", + "last_updated": "2025-06-27", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "kilo/openrouter/aurora-alpha", + "name": "Aurora Alpha (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-09", + "last_updated": "2026-02-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 50000 + } + }, + { + "id": "kilo/perplexity/sonar", + "name": "Perplexity: Sonar", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 1.0 + }, + "limit": { + "context": 127072, + "output": 25415 + } + }, + { + "id": "kilo/perplexity/sonar-deep-research", + "name": "Perplexity: Sonar Deep Research", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0 + }, + "limit": { + "context": 128000, + "output": 25600 + } + }, + { + "id": "kilo/perplexity/sonar-pro", + "name": "Perplexity: Sonar Pro", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0 + }, + "limit": { + "context": 200000, + "output": 8000 + } + }, + { + "id": "kilo/perplexity/sonar-reasoning-pro", + "name": "Perplexity: Sonar Reasoning Pro", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0 + }, + "limit": { + "context": 128000, + "output": 25600 + } + }, + { + "id": "kilo/prime-intellect/intellect-3", + "name": "Prime Intellect: INTELLECT-3", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-26", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.1 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.39 + }, + "limit": { + "context": 32768, + "output": 16384 + } + }, + { + "id": "kilo/qwen/qwen-2.5-7b-instruct", + "name": "Qwen: Qwen2.5 7B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.1 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-11-11", + "last_updated": "2024-11-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.11, + "cache_read": 0.015 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen-2.5-vl-7b-instruct", + "name": "Qwen: Qwen2.5-VL 7B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-08-28", + "last_updated": "2024-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/qwen/qwen-max", + "name": "Qwen: Qwen-Max ", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-03", + "last_updated": "2025-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.6, + "output": 6.4, + "cache_read": 0.32 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "kilo/qwen/qwen-plus", + "name": "Qwen: Qwen-Plus", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-01-25", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.2, + "cache_read": 0.08 + }, + "limit": { + "context": 1000000, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen-turbo", + "name": "Qwen: Qwen-Turbo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-01", + "last_updated": "2025-07-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.2, + "cache_read": 0.01 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "kilo/qwen/qwen-vl-max", + "name": "Qwen: Qwen VL Max", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-08", + "last_updated": "2025-08-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 3.2 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen-vl-plus", + "name": "Qwen: Qwen VL Plus", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-01-25", + "last_updated": "2025-08-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 0.63, + "cache_read": 0.042 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "kilo/qwen/qwen2.5-coder-7b-instruct", + "name": "Qwen: Qwen2.5 Coder 7B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-09-17", + "last_updated": "2024-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.09 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/qwen/qwen2.5-vl-32b-instruct", + "name": "Qwen: Qwen2.5 VL 32B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "kilo/qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen: Qwen2.5 VL 72B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-02-01", + "last_updated": "2025-02-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-14b", + "name": "Qwen: Qwen3 14B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "kilo/qwen/qwen3-235b-a22b", + "name": "Qwen: Qwen3 235B A22B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "kilo/qwen/qwen3-235b-a22b-thinking", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/qwen/qwen3-30b-a3b", + "name": "Qwen: Qwen3 30B A3B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.22, + "cache_read": 0.03 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "kilo/qwen/qwen3-30b-a3b-instruct", + "name": "Qwen: Qwen3 30B A3B Instruct 2507", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.33, + "cache_read": 0.04 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "kilo/qwen/qwen3-30b-a3b-thinking", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.051, + "output": 0.34 + }, + "limit": { + "context": 32768, + "output": 6554 + } + }, + { + "id": "kilo/qwen/qwen3-32b", + "name": "Qwen: Qwen3 32B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "kilo/qwen/qwen3-4b", + "name": "Qwen: Qwen3 4B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-29", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0715, + "output": 0.273 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "kilo/qwen/qwen3-4b:free", + "name": "Qwen: Qwen3 4B (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 8192 + } + }, + { + "id": "kilo/qwen/qwen3-8b", + "name": "Qwen: Qwen3 8B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.05 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "kilo/qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 1.0, + "cache_read": 0.022 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.27 + }, + "limit": { + "context": 160000, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-coder-flash", + "name": "Qwen: Qwen3 Coder Flash", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.5, + "cache_read": 0.06 + }, + "limit": { + "context": 1000000, + "output": 65536 + } + }, + { + "id": "kilo/qwen/qwen3-coder-next", + "name": "Qwen: Qwen3 Coder Next", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-02", + "last_updated": "2026-02-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.3, + "cache_read": 0.035 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "kilo/qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder Plus", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1000000, + "output": 65536 + } + }, + { + "id": "kilo/qwen/qwen3-coder:exacto", + "name": "Qwen: Qwen3 Coder 480B A35B (exacto)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "kilo/qwen/qwen3-coder:free", + "name": "Qwen: Qwen3 Coder 480B A35B (free)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "kilo/qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 6.0, + "cache_read": 0.24 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "kilo/qwen/qwen3-max-thinking", + "name": "Qwen: Qwen3 Max Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-23", + "last_updated": "2026-01-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 6.0 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "kilo/qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen: Qwen3 Next 80B A3B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 1.1 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/qwen/qwen3-next-80b-a3b-instruct:free", + "name": "Qwen: Qwen3 Next 80B A3B Instruct (free)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen: Qwen3 Next 80B A3B Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.2 + }, + "limit": { + "context": 128000, + "output": 25600 + } + }, + { + "id": "kilo/qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-23", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.88, + "cache_read": 0.11 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen: Qwen3 VL 235B A22B Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-vl-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-05", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.52 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-vl-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-11", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-vl-32b-instruct", + "name": "Qwen: Qwen3 VL 32B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.104, + "output": 0.416 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-vl-8b-instruct", + "name": "Qwen: Qwen3 VL 8B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.5 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3-vl-8b-thinking", + "name": "Qwen: Qwen3 VL 8B Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.117, + "output": 1.365 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "kilo/qwen/qwen3.5-397b-a17b", + "name": "Qwen: Qwen3.5 397B A17B", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "kilo/qwen/qwen3.5-plus-02-15", + "name": "Qwen: Qwen3.5 Plus 2026-02-15", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "kilo/qwen/qwq-32b", + "name": "Qwen: QwQ 32B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-28", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.4 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "kilo/stepfun/step-3.5-flash", + "name": "StepFun: Step 3.5 Flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "kilo/stepfun/step-3.5-flash:free", + "name": "StepFun: Step 3.5 Flash (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "kilo/tencent/hunyuan-a13b-instruct", + "name": "Tencent: Hunyuan A13B Instruct", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/tngtech/deepseek-r1t-chimera", + "name": "TNG: DeepSeek R1T Chimera", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "kilo/tngtech/deepseek-r1t2-chimera", + "name": "TNG: DeepSeek R1T2 Chimera", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.85, + "cache_read": 0.125 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "kilo/tngtech/tng-r1t-chimera", + "name": "TNG: R1T Chimera", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-26", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.85, + "cache_read": 0.125 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "kilo/writer/palmyra-x5", + "name": "Writer: Palmyra X5", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.6, + "output": 6.0 + }, + "limit": { + "context": 1040000, + "output": 8192 + } + }, + { + "id": "kilo/x-ai/grok-3", + "name": "xAI: Grok 3", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/x-ai/grok-3-beta", + "name": "xAI: Grok 3 Beta", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/x-ai/grok-3-mini", + "name": "xAI: Grok 3 Mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/x-ai/grok-3-mini-beta", + "name": "xAI: Grok 3 Mini Beta", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "limit": { + "context": 131072, + "output": 26215 + } + }, + { + "id": "kilo/x-ai/grok-4", + "name": "xAI: Grok 4", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 256000, + "output": 51200 + } + }, + { + "id": "kilo/x-ai/grok-4-fast", + "name": "xAI: Grok 4 Fast", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "kilo/x-ai/grok-4.1-fast", + "name": "xAI: Grok 4.1 Fast", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "kilo/x-ai/grok-code-fast-1", + "name": "xAI: Grok Code Fast 1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 10000 + } + }, + { + "id": "kilo/xiaomi/mimo-v2-flash", + "name": "Xiaomi: MiMo-V2-Flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-14", + "last_updated": "2025-12-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 + }, + "limit": { + "context": 262144, + "output": 52429 + } + }, + { + "id": "kilo/z-ai/glm-4.5", + "name": "Z.ai: GLM 4.5", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.55, + "cache_read": 0.175 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "kilo/z-ai/glm-4.5-air", + "name": "Z.ai: GLM 4.5 Air", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.85, + "cache_read": 0.025 + }, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "kilo/z-ai/glm-4.5-air:free", + "name": "Z.ai: GLM 4.5 Air (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 96000 + } + }, + { + "id": "kilo/z-ai/glm-4.5v", + "name": "Z.ai: GLM 4.5V", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 + }, + "limit": { + "context": 65536, + "output": 16384 + } + }, + { + "id": "kilo/z-ai/glm-4.6", + "name": "Z.ai: GLM 4.6", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.5, + "cache_read": 0.175 + }, + "limit": { + "context": 202752, + "output": 65536 + } + }, + { + "id": "kilo/z-ai/glm-4.6:exacto", + "name": "Z.ai: GLM 4.6 (exacto)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.44, + "output": 1.76, + "cache_read": 0.11 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "kilo/z-ai/glm-4.6v", + "name": "Z.ai: GLM 4.6V", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2026-01-10", + "modalities": { + "input": [ + "image", + "text", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "kilo/z-ai/glm-4.7", + "name": "Z.ai: GLM 4.7", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.5, + "cache_read": 0.2 + }, + "limit": { + "context": 202752, + "output": 65535 + } + }, + { + "id": "kilo/z-ai/glm-4.7-flash", + "name": "Z.ai: GLM 4.7 Flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 202752, + "output": 40551 + } + }, + { + "id": "kilo/z-ai/glm-5", + "name": "Z.ai: GLM 5", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 2.55 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "kilo/z-ai/glm-5:free", + "name": "Z.ai: GLM 5 (free)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 202800, + "output": 131072 + } + }, + { + "id": "kimi-for-coding/k2p5", + "name": "Kimi K2.5", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "kimi-for-coding/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "kuae-cloud-coding-plan/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "lmstudio/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "lmstudio/qwen/qwen3-30b-a3b", + "name": "Qwen3 30B A3B 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "lmstudio/qwen/qwen3-coder-30b", + "name": "Qwen3 Coder 30B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "lucidquery/lucidnova-rf1-100b", + "name": "LucidNova RF1 100B", + "family": "nova", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-09-16", + "release_date": "2024-12-28", + "last_updated": "2025-09-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 5.0 + }, + "limit": { + "context": 120000, + "output": 8000 + } + }, + { + "id": "lucidquery/lucidquery-nexus-coder", + "name": "LucidQuery Nexus Coder", + "family": "lucid", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 5.0 + }, + "limit": { + "context": 250000, + "output": 60000 + } + }, + { + "id": "meganova/MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.2 + }, + "limit": { + "context": 196608, + "output": 131072 + } + }, + { + "id": "meganova/MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "meganova/Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "meganova/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "meganova/Qwen/Qwen3.5-Plus", + "name": "Qwen3.5 Plus", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02", + "last_updated": "2026-02", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4 + }, + "limit": { + "context": 1000000, + "output": 65536 + } + }, + { + "id": "meganova/XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo V2 Flash", + "family": "mimo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 262144, + "output": 32000 + } + }, + { + "id": "meganova/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1 0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 2.15 + }, + "limit": { + "context": 163840, + "output": 64000 + } + }, + { + "id": "meganova/deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.88 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "meganova/deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "meganova/deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.26, + "output": 0.38 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "meganova/deepseek-ai/DeepSeek-V3.2-Exp", + "name": "DeepSeek V3.2 Exp", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-10", + "last_updated": "2025-10-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.4 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "meganova/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "meganova/mistralai/Mistral-Nemo-Instruct", + "name": "Mistral Nemo Instruct 2407", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.04 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "meganova/mistralai/Mistral-Small-3.2-24B-Instruct", + "name": "Mistral Small 3.2 24B Instruct", + "family": "mistral-small", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "meganova/moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.6 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "meganova/moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.45, + "output": 2.8 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "meganova/zai-org/GLM-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.45, + "output": 1.9 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "meganova/zai-org/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "meganova/zai-org/GLM-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 2.56 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "meta-llama/cerebras-llama-4-maverick-17b-128e-instruct", + "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "meta-llama/cerebras-llama-4-scout-17b-16e-instruct", + "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "meta-llama/groq-llama-4-maverick-17b-128e-instruct", + "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "meta-llama/llama-3.3-8b-instruct", + "name": "Llama-3.3-8B-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "meta-llama/llama-4-scout-17b-16e-instruct-fp8", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "minimax-cn-coding-plan/MiniMax-M2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 196608, + "output": 128000 + } + }, + { + "id": "minimax-cn-coding-plan/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-cn-coding-plan/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-cn-coding-plan/MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-cn/MiniMax-M2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 196608, + "output": 128000 + } + }, + { + "id": "minimax-cn/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-cn/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-cn/MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-coding-plan/MiniMax-M2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 196608, + "output": 128000 + } + }, + { + "id": "minimax-coding-plan/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-coding-plan/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax-coding-plan/MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax/MiniMax-M2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 196608, + "output": 128000 + } + }, + { + "id": "minimax/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "minimax/MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "mistralai/codestral", + "name": "Codestral", + "family": "codestral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 256000, + "output": 4096 + } + }, + { + "id": "mistralai/devstral", + "name": "Devstral 2", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "mistralai/devstral-medium", + "name": "Devstral 2", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "mistralai/devstral-small", + "name": "Devstral Small", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "mistralai/labs-devstral-small", + "name": "Devstral Small 2", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "mistralai/magistral-medium", + "name": "Magistral Medium", + "family": "magistral-medium", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 5.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "mistralai/magistral-small", + "name": "Magistral Small", + "family": "magistral-small", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 1.5 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "mistralai/ministral-3b", + "name": "Ministral 3B", + "family": "ministral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.04 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "mistralai/ministral-8b", + "name": "Ministral 8B", + "family": "ministral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "mistralai/mistral-embed", + "name": "Mistral Embed", + "family": "mistral-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 8000, + "output": 3072 + } + }, + { + "id": "mistralai/mistral-large", + "name": "Mistral Large 2.1", + "family": "mistral-large", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "mistralai/mistral-medium", + "name": "Mistral Medium", + "family": "mistral-medium", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "mistralai/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "mistralai/mistral-small", + "name": "Mistral Small", + "family": "mistral-small", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2024-09-01", + "last_updated": "2024-09-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "mistralai/open-mistral-7b", + "name": "Mistral 7B", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.25 + }, + "limit": { + "context": 8000, + "output": 8000 + } + }, + { + "id": "mistralai/open-mixtral-8x22b", + "name": "Mixtral 8x22B", + "family": "mixtral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 64000, + "output": 64000 + } + }, + { + "id": "mistralai/open-mixtral-8x7b", + "name": "Mixtral 8x7B", + "family": "mixtral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-01", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 0.7 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "mistralai/pixtral-12b", + "name": "Pixtral 12B", + "family": "pixtral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "mistralai/pixtral-large", + "name": "Pixtral Large", + "family": "pixtral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "moark/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 3.5, + "output": 14.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "moark/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.1, + "output": 8.4 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "modelscope/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "modelscope/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen3-235B-A22B-Thinking-2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "modelscope/Qwen/Qwen3-30B-A3B-Instruct", + "name": "Qwen3 30B A3B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "modelscope/Qwen/Qwen3-30B-A3B-Thinking", + "name": "Qwen3 30B A3B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "modelscope/Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "modelscope/ZhipuAI/GLM-4.5", + "name": "GLM-4.5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "modelscope/ZhipuAI/GLM-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 202752, + "output": 98304 + } + }, + { + "id": "moonshotai-cn/kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "moonshotai-cn/kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai-cn/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai-cn/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.15, + "output": 8.0, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai-cn/kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.4, + "output": 10.0, + "cache_read": 0.6 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai-cn/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.1 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai/kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "moonshotai/kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.15, + "output": 8.0, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai/kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.4, + "output": 10.0, + "cache_read": 0.6 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.1 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "morph/auto", + "name": "Auto", + "family": "auto", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.85, + "output": 1.55 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "morph/morph-v3-fast", + "name": "Morph v3 Fast", + "family": "morph", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 1.2 + }, + "limit": { + "context": 16000, + "output": 16000 + } + }, + { + "id": "morph/morph-v3-large", + "name": "Morph v3 Large", + "family": "morph", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.9, + "output": 1.9 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "nano-gpt/deepseek/deepseek-r1", + "name": "Deepseek R1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/deepseek/deepseek-v3.2:thinking", + "name": "Deepseek V3.2 Thinking", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/meta-llama/llama-4-maverick", + "name": "Llama 4 Maverick", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/minimax/minimax-m2.1", + "name": "Minimax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "nano-gpt/minimax/minimax-m2.5-official", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "nano-gpt/mistralai/devstral-2-123b-instruct", + "name": "Devstral 2 123b Instruct 2512", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-11", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nano-gpt/mistralai/ministral-14b-instruct", + "name": "Ministral 14b Instruct 2512", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nano-gpt/mistralai/mistral-large-3-675b-instruct", + "name": "Mistral Large 3 675b Instruct 2512", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nano-gpt/moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nano-gpt/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "nano-gpt/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-26", + "last_updated": "2026-01-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.9 + }, + "limit": { + "context": 256000, + "output": 65536 + } + }, + { + "id": "nano-gpt/moonshotai/kimi-k2.5-thinking", + "name": "Kimi K2.5 Thinking", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-26", + "last_updated": "2026-01-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.9 + }, + "limit": { + "context": 256000, + "output": 65536 + } + }, + { + "id": "nano-gpt/nousresearch/hermes-4-405b:thinking", + "name": "Hermes 4 405b Thinking", + "family": "hermes", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-13", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/nvidia/llama-3_3-nemotron-super-49b-v1_5", + "name": "Llama 3 3 Nemotron Super 49B V1 5", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-08", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/openai/gpt-oss-120b", + "name": "GPT Oss 120b", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-06-23", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/qwen/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 8192 + } + }, + { + "id": "nano-gpt/qwen/qwen3-coder", + "name": "Qwen3 Coder", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 106000, + "output": 8192 + } + }, + { + "id": "nano-gpt/qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 258000, + "output": 8192 + } + }, + { + "id": "nano-gpt/qwen/qwen3.5-397b-a17b-thinking", + "name": "Qwen3.5 397B A17B Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 258000, + "output": 8192 + } + }, + { + "id": "nano-gpt/qwen/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4 + }, + "limit": { + "context": 983600, + "output": 8192 + } + }, + { + "id": "nano-gpt/qwen/qwen3.5-plus-thinking", + "name": "Qwen3.5 Plus Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4 + }, + "limit": { + "context": 983600, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-4.5-air:thinking", + "name": "GLM 4.5 Air Thinking", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-07", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-4.6:thinking", + "name": "GLM 4.6 Thinking", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-07", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-4.7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 204800, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-4.7:thinking", + "name": "GLM 4.7 Thinking", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-07", + "last_updated": "2025-12-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nano-gpt/zai-org/glm-5", + "name": "GLM 5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 2.56 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "nano-gpt/zai-org/glm-5-original", + "name": "GLM 5 Original", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 2.56 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "nano-gpt/zai-org/glm-5-original:thinking", + "name": "GLM 5 Original Thinking", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 2.56 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "nano-gpt/zai-org/glm-5:thinking", + "name": "GLM 5 Thinking", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 2.56 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "nebius/BAAI/bge-en-icl", + "name": "BGE-ICL", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-06", + "release_date": "2024-07-30", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 0 + } + }, + { + "id": "nebius/BAAI/bge-multilingual-gemma2", + "name": "bge-multilingual-gemma2", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-06", + "release_date": "2024-07-30", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 0 + } + }, + { + "id": "nebius/MiniMaxAI/minimax-m2.1", + "name": "MiniMax-M2.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2026-02-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/NousResearch/hermes-4-405b", + "name": "Hermes-4-405B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/NousResearch/hermes-4-70b", + "name": "Hermes-4-70B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/PrimeIntellect/intellect-3", + "name": "INTELLECT-3", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2026-01-25", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.1, + "cache_read": 0.02, + "cache_write": 0.25 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/black-forest-labs/flux-dev", + "name": "FLUX.1-dev", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 77, + "output": 0 + } + }, + { + "id": "nebius/black-forest-labs/flux-schnell", + "name": "FLUX.1-schnell", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 77, + "output": 0 + } + }, + { + "id": "nebius/deepseek-ai/deepseek-r1", + "name": "DeepSeek-R1-0528", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2026-01-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 2.4, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "nebius/deepseek-ai/deepseek-r1-0528-fast", + "name": "DeepSeek R1 0528 Fast", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 6.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nebius/deepseek-ai/deepseek-v3", + "name": "DeepSeek-V3-0324", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-03-24", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 0.05, + "cache_write": 0.1875 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/deepseek-ai/deepseek-v3-0324-fast", + "name": "DeepSeek-V3-0324 (Fast)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-03-24", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 2.25, + "cache_read": 0.075, + "cache_write": 0.28125 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/deepseek-ai/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.45, + "cache_read": 0.03, + "cache_write": 0.375 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/google/gemma-2-2b-it", + "name": "Gemma-2-2b-it", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-07-31", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 + }, + "limit": { + "context": 8192, + "output": 4096 + } + }, + { + "id": "nebius/google/gemma-2-9b-it-fast", + "name": "Gemma-2-9b-it (Fast)", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-27", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.09, + "cache_read": 0.003, + "cache_write": 0.0375 + }, + "limit": { + "context": 8192, + "output": 4096 + } + }, + { + "id": "nebius/google/gemma-3-27b-it", + "name": "Gemma-3-27b-it", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/google/gemma-3-27b-it-fast", + "name": "Gemma-3-27b-it (Fast)", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6, + "cache_read": 0.02, + "cache_write": 0.25 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/intfloat/e5-mistral-7b-instruct", + "name": "e5-mistral-7b-instruct", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2023-12", + "release_date": "2024-01-01", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 0 + } + }, + { + "id": "nebius/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/meta-llama/llama-3.3-70b-instruct-fast", + "name": "Llama-3.3-70B-Instruct (Fast)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/meta-llama/llama-guard-3-8b", + "name": "Llama-Guard-3-8B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2024-04-18", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 + }, + "limit": { + "context": 8192, + "output": 1024 + } + }, + { + "id": "nebius/meta-llama/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nebius/meta-llama/meta-llama-3.1-8b-instruct-fast", + "name": "Meta-Llama-3.1-8B-Instruct (Fast)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.09, + "cache_read": 0.003, + "cache_write": 0.03 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nebius/moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 + }, + "limit": { + "context": 262144, + "output": 8192 + } + }, + { + "id": "nebius/moonshotai/kimi-k2-instruct", + "name": "Kimi-K2-Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2026-01-05", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.4, + "cache_read": 0.05, + "cache_write": 0.625 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "nebius/moonshotai/kimi-k2-thinking", + "name": "Kimi-K2-Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2026-01-05", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.06, + "cache_write": 0.75 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "nebius/nvidia/llama-3_1-nemotron-ultra-253b-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.8, + "cache_read": 0.06, + "cache_write": 0.75 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nebius/nvidia/nemotron-nano-v2-12b", + "name": "Nemotron-Nano-V2-12b", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.2, + "cache_read": 0.007, + "cache_write": 0.08 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "nebius/nvidia/nvidia-nemotron-3-nano-30b-a3b", + "name": "Nemotron-3-Nano-30B-A3B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-08-10", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "nebius/openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.015, + "cache_write": 0.18 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/openai/gpt-oss-20b", + "name": "gpt-oss-20b", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.2, + "cache_read": 0.005, + "cache_write": 0.06 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nebius/qwen/qwen2.5-coder-7b-fast", + "name": "Qwen2.5-Coder-7B (Fast)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-09-19", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.09, + "cache_read": 0.003, + "cache_write": 0.03 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-235b-a22b-instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 262144, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-30b-a3b-instruct", + "name": "Qwen3-30B-A3B-Instruct-2507", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-30b-a3b-thinking", + "name": "Qwen3-30B-A3B-Thinking-2507", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "nebius/qwen/qwen3-32b", + "name": "Qwen3-32B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-32b-fast", + "name": "Qwen3-32B (Fast)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6, + "cache_read": 0.02, + "cache_write": 0.25 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nebius/qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-10-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.8 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "nebius/qwen/qwen3-embedding-8b", + "name": "Qwen3-Embedding-8B", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-10", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 0 + } + }, + { + "id": "nebius/qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.2, + "cache_read": 0.015, + "cache_write": 0.18 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "nebius/zai-org/glm-4.5", + "name": "GLM-4.5", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-11-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.06, + "cache_write": 0.75 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nebius/zai-org/glm-4.5-air", + "name": "GLM-4.5-Air", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-11-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nebius/zai-org/glm-4.7-fp8", + "name": "GLM-4.7 (FP8)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2026-01-15", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0, + "cache_read": 0.04, + "cache_write": 0.5 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nova/nova-2-lite-v1", + "name": "Nova 2 Lite", + "family": "nova-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text", + "image", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "nova/nova-2-pro-v1", + "name": "Nova 2 Pro", + "family": "nova-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-03", + "last_updated": "2026-01-03", + "modalities": { + "input": [ + "text", + "image", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "novita-ai/baichuan/baichuan-m2-32b", + "name": "baichuan-m2-32b", + "family": "baichuan", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.07 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "novita-ai/baidu/ernie-4.5-21B-a3b", + "name": "ERNIE 4.5 21B A3B", + "family": "ernie", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 120000, + "output": 8000 + } + }, + { + "id": "novita-ai/baidu/ernie-4.5-21B-a3b-thinking", + "name": "ERNIE-4.5-21B-A3B-Thinking", + "family": "ernie", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "novita-ai/baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.1 + }, + "limit": { + "context": 123000, + "output": 12000 + } + }, + { + "id": "novita-ai/baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE 4.5 VL 28B A3B", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.4, + "output": 5.6 + }, + "limit": { + "context": 30000, + "output": 8000 + } + }, + { + "id": "novita-ai/baidu/ernie-4.5-vl-28b-a3b-thinking", + "name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-26", + "last_updated": "2025-11-26", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.39, + "output": 0.39 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "novita-ai/baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.42, + "output": 1.25 + }, + "limit": { + "context": 123000, + "output": 16000 + } + }, + { + "id": "novita-ai/deepseek/deepseek-ocr", + "name": "DeepSeek-OCR", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-24", + "last_updated": "2025-10-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.03 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/deepseek/deepseek-ocr-2", + "name": "deepseek/deepseek-ocr-2", + "attachment": true, + "reasoning": false, + "tool_call": false, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.03 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/deepseek/deepseek-prover-v2-671b", + "name": "Deepseek Prover V2 671B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-04-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.5 + }, + "limit": { + "context": 160000, + "output": 160000 + } + }, + { + "id": "novita-ai/deepseek/deepseek-r1", + "name": "DeepSeek R1 0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 + }, + "limit": { + "context": 163840, + "output": 32768 + } + }, + { + "id": "novita-ai/deepseek/deepseek-r1-0528-qwen3-8b", + "name": "DeepSeek R1 0528 Qwen3 8B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-05-29", + "last_updated": "2025-05-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.06, + "output": 0.09 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "novita-ai/deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill LLama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 0.8 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/deepseek/deepseek-r1-turbo", + "name": "DeepSeek R1 (Turbo)\t", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.5 + }, + "limit": { + "context": 64000, + "output": 16000 + } + }, + { + "id": "novita-ai/deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.12, + "cache_read": 0.135 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "novita-ai/deepseek/deepseek-v3-turbo", + "name": "DeepSeek V3 (Turbo)\t", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.3 + }, + "limit": { + "context": 64000, + "output": 16000 + } + }, + { + "id": "novita-ai/deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0, + "cache_read": 0.135 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/deepseek/deepseek-v3.1-terminus", + "name": "Deepseek V3.1 Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0, + "cache_read": 0.135 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.269, + "output": 0.4, + "cache_read": 0.1345 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "novita-ai/deepseek/deepseek-v3.2-exp", + "name": "Deepseek V3.2 Exp", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.41 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "novita-ai/google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.119, + "output": 0.2 + }, + "limit": { + "context": 98304, + "output": 16384 + } + }, + { + "id": "novita-ai/gryphe/mythomax-l2-13b", + "name": "Mythomax L2 13B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.09 + }, + "limit": { + "context": 4096, + "output": 3200 + } + }, + { + "id": "novita-ai/kwaipilot/kat-coder", + "name": "KAT-Coder-Pro V1(Free)", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "novita-ai/kwaipilot/kat-coder-pro", + "name": "Kat Coder Pro", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-05", + "last_updated": "2026-01-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 + }, + "limit": { + "context": 256000, + "output": 128000 + } + }, + { + "id": "novita-ai/meta-llama/llama-3-70b-instruct", + "name": "Llama3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.51, + "output": 0.74 + }, + "limit": { + "context": 8192, + "output": 8000 + } + }, + { + "id": "novita-ai/meta-llama/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.04 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-07-24", + "last_updated": "2024-07-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.05 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "novita-ai/meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-07", + "last_updated": "2024-12-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.135, + "output": 0.4 + }, + "limit": { + "context": 131072, + "output": 120000 + } + }, + { + "id": "novita-ai/meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-06", + "last_updated": "2025-04-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.85 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "novita-ai/meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-06", + "last_updated": "2025-04-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.18, + "output": 0.59 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "novita-ai/microsoft/wizardlm-2-8x22b", + "name": "Wizardlm 2 8x22B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.62, + "output": 0.62 + }, + "limit": { + "context": 65535, + "output": 8000 + } + }, + { + "id": "novita-ai/minimax/minimax-m2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "novita-ai/minimax/minimax-m2.1", + "name": "Minimax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "novita-ai/minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 204800, + "output": 131100 + } + }, + { + "id": "novita-ai/minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.2 + }, + "limit": { + "context": 1000000, + "output": 40000 + } + }, + { + "id": "novita-ai/mistralai/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-07-30", + "last_updated": "2024-07-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.17 + }, + "limit": { + "context": 60288, + "output": 16000 + } + }, + { + "id": "novita-ai/moonshotai/kimi-k2", + "name": "Kimi K2 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "novita-ai/moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.57, + "output": 2.3 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "novita-ai/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "novita-ai/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.1 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "novita-ai/nousresearch/hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-06-27", + "last_updated": "2024-06-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 0.14 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.25 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/openai/gpt-oss-20b", + "name": "OpenAI: GPT OSS 20B", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.15 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/paddlepaddle/paddleocr-vl", + "name": "PaddleOCR-VL", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.02 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "novita-ai/qwen/qwen-2.5-72b-instruct", + "name": "Qwen 2.5 72B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-10-15", + "last_updated": "2024-10-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.38, + "output": 0.4 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "novita-ai/qwen/qwen-mt-plus", + "name": "Qwen MT Plus", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-03", + "last_updated": "2025-09-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.75 + }, + "limit": { + "context": 16384, + "output": 8192 + } + }, + { + "id": "novita-ai/qwen/qwen2.5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.07 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "novita-ai/qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 0.8 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 40960, + "output": 20000 + } + }, + { + "id": "novita-ai/qwen/qwen3-235b-a22b-instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.58 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "novita-ai/qwen/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22b Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 3.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.45 + }, + "limit": { + "context": 40960, + "output": 20000 + } + }, + { + "id": "novita-ai/qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.45 + }, + "limit": { + "context": 40960, + "output": 20000 + } + }, + { + "id": "novita-ai/qwen/qwen3-4b-fp8", + "name": "Qwen3 4B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.03 + }, + "limit": { + "context": 128000, + "output": 20000 + } + }, + { + "id": "novita-ai/qwen/qwen3-8b-fp8", + "name": "Qwen3 8B", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.035, + "output": 0.138 + }, + "limit": { + "context": 128000, + "output": 20000 + } + }, + { + "id": "novita-ai/qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30b A3B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-09", + "last_updated": "2025-10-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.27 + }, + "limit": { + "context": 160000, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.3 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "novita-ai/qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.5 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "novita-ai/qwen/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.11, + "output": 8.45 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "novita-ai/qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-omni-30b-a3b-instruct", + "name": "Qwen3 Omni 30B A3B Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "video", + "audio", + "image" + ], + "output": [ + "text", + "audio" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.97 + }, + "limit": { + "context": 65536, + "output": 16384 + } + }, + { + "id": "novita-ai/qwen/qwen3-omni-30b-a3b-thinking", + "name": "Qwen3 Omni 30B A3B Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "audio", + "video", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 0.97 + }, + "limit": { + "context": 65536, + "output": 16384 + } + }, + { + "id": "novita-ai/qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.5 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.98, + "output": 3.95 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", + "modalities": { + "input": [ + "text", + "video", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.7 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-17", + "last_updated": "2025-10-17", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.08, + "output": 0.5 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 262144, + "output": 64000 + } + }, + { + "id": "novita-ai/sao10k/L3-8B-Stheno-v3.2", + "name": "L3 8B Stheno V3.2", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-29", + "last_updated": "2024-11-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.05 + }, + "limit": { + "context": 8192, + "output": 32000 + } + }, + { + "id": "novita-ai/sao10k/l3-70b-euryale-v2.1", + "name": "L3 70B Euryale V2.1\t", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-06-18", + "last_updated": "2024-06-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.48, + "output": 1.48 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/sao10k/l3-8b-lunaris", + "name": "Sao10k L3 8B Lunaris\t", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-11-28", + "last_updated": "2024-11-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.05 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/sao10k/l31-70b-euryale-v2.2", + "name": "L31 70B Euryale V2.2", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.48, + "output": 1.48 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "novita-ai/skywork/r1v4-lite", + "name": "Skywork R1V4-Lite", + "family": "skywork", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "novita-ai/xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "family": "mimo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.3 + }, + "limit": { + "context": 262144, + "output": 32000 + } + }, + { + "id": "novita-ai/zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-10", + "last_updated": "2025-12-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.035, + "output": 0.138 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "novita-ai/zai-org/glm-4.5", + "name": "GLM-4.5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + }, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "novita-ai/zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "family": "glm-air", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-10-13", + "last_updated": "2025-10-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.85 + }, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "novita-ai/zai-org/glm-4.5v", + "name": "GLM 4.5V", + "family": "glmv", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "modalities": { + "input": [ + "text", + "video", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 + }, + "limit": { + "context": 65536, + "output": 16384 + } + }, + { + "id": "novita-ai/zai-org/glm-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.2, + "cache_read": 0.11 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "novita-ai/zai-org/glm-4.6v", + "name": "GLM 4.6V", + "family": "glmv", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "modalities": { + "input": [ + "text", + "video", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9, + "cache_read": 0.055 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "novita-ai/zai-org/glm-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "novita-ai/zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "novita-ai/zai-org/glm-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 + }, + "limit": { + "context": 202800, + "output": 131072 + } + }, + { + "id": "nvidia/black-forest-labs/flux.1-dev", + "name": "FLUX.1-dev", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-08-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 4096, + "output": 0 + } + }, + { + "id": "nvidia/deepseek-ai/deepseek-coder-6.7b-instruct", + "name": "Deepseek Coder 6.7b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2023-10-29", + "last_updated": "2023-10-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/deepseek-ai/deepseek-r1", + "name": "Deepseek R1", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/deepseek-ai/deepseek-v3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-08-20", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nvidia/deepseek-ai/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nvidia/deepseek-ai/deepseek-v3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "nvidia/google/codegemma-1.1-7b", + "name": "Codegemma 1.1 7b", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-04-30", + "last_updated": "2024-04-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/codegemma-7b", + "name": "Codegemma 7b", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-03-21", + "last_updated": "2024-03-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/gemma-2-27b-it", + "name": "Gemma 2 27b It", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-06-24", + "last_updated": "2024-06-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/gemma-2-2b-it", + "name": "Gemma 2 2b It", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/gemma-3-12b-it", + "name": "Gemma 3 12b It", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/gemma-3-1b-it", + "name": "Gemma 3 1b It", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "family": "gemma", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nvidia/google/gemma-3n-e2b-it", + "name": "Gemma 3n E2b It", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/google/gemma-3n-e4b-it", + "name": "Gemma 3n E4b It", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/codellama-70b", + "name": "Codellama 70b", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-01-29", + "last_updated": "2024-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-3.1-405b-instruct", + "name": "Llama 3.1 405b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-3.1-70b-instruct", + "name": "Llama 3.1 70b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11b Vision Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-26", + "last_updated": "2024-11-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17b 128e Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-02", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17b 16e Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-02", + "release_date": "2025-04-02", + "last_updated": "2025-04-02", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama3-70b-instruct", + "name": "Llama3 70b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/meta/llama3-8b-instruct", + "name": "Llama3 8b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3-medium-128k-instruct", + "name": "Phi 3 Medium 128k Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3-medium-4k-instruct", + "name": "Phi 3 Medium 4k Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 4000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3-small-128k-instruct", + "name": "Phi 3 Small 128k Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3-small-8k-instruct", + "name": "Phi 3 Small 8k Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3-vision-128k-instruct", + "name": "Phi 3 Vision 128k Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-05-19", + "last_updated": "2024-05-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3.5-moe-instruct", + "name": "Phi 3.5 Moe Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-17", + "last_updated": "2024-08-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-3.5-vision-instruct", + "name": "Phi 3.5 Vision Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-08-16", + "last_updated": "2024-08-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/microsoft/phi-4-mini-instruct", + "name": "Phi-4-Mini", + "family": "phi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nvidia/minimaxai/minimax-m2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-10-27", + "last_updated": "2025-10-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "nvidia/minimaxai/minimax-m2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "nvidia/mistralai/codestral-22b-instruct-v0.1", + "name": "Codestral 22b Instruct V0.1", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-05-29", + "last_updated": "2024-05-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/mistralai/devstral-2-123b-instruct", + "name": "Devstral-2-123B-Instruct-2512", + "family": "devstral", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "nvidia/mistralai/mamba-codestral-7b-v0.1", + "name": "Mamba Codestral 7b V0.1", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/mistralai/ministral-14b-instruct", + "name": "Ministral 3 14B Instruct 2512", + "family": "ministral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-08", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "nvidia/mistralai/mistral-large-2-instruct", + "name": "Mistral Large 2 Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-24", + "last_updated": "2024-07-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/mistralai/mistral-large-3-675b-instruct", + "name": "Mistral Large 3 675B Instruct 2512", + "family": "mistral-large", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "nvidia/mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral Small 3.1 24b Instruct 2503", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-01", + "release_date": "2025-01-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nvidia/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "nvidia/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "nvidia/nvidia/cosmos-nemotron-34b", + "name": "Cosmos Nemotron 34B", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nvidia/nvidia/llama-3.1-nemotron-51b-instruct", + "name": "Llama 3.1 Nemotron 51b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-22", + "last_updated": "2024-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/llama-3.1-nemotron-70b-instruct", + "name": "Llama 3.1 Nemotron 70b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-10-12", + "last_updated": "2024-10-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/llama-3.1-nemotron-ultra-253b-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nvidia/nvidia/llama-3.3-nemotron-super-49b-v1", + "name": "Llama 3.3 Nemotron Super 49b V1", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-16", + "last_updated": "2025-03-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "Llama 3.3 Nemotron Super 49b V1.5", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-16", + "last_updated": "2025-03-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/llama-embed-nemotron-8b", + "name": "Llama Embed Nemotron 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2025-03", + "release_date": "2025-03-18", + "last_updated": "2025-03-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 2048 + } + }, + { + "id": "nvidia/nvidia/llama3-chatqa-1.5-70b", + "name": "Llama3 Chatqa 1.5 70b", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-04-28", + "last_updated": "2024-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/nemoretriever-ocr-v1", + "name": "NeMo Retriever OCR v1", + "family": "nemoretriever", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 0, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/nemotron-3-nano-30b-a3b", + "name": "nemotron-3-nano-30b-a3b", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-12", + "last_updated": "2024-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "nvidia/nvidia/nemotron-4-340b-instruct", + "name": "Nemotron 4 340b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-06-13", + "last_updated": "2024-06-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/nvidia/nvidia-nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "nvidia/nvidia/parakeet-tdt-0.6b-v2", + "name": "Parakeet TDT 0.6B v2", + "family": "parakeet", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 0, + "output": 4096 + } + }, + { + "id": "nvidia/openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "family": "gpt-oss", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "nvidia/openai/whisper-large-v3", + "name": "Whisper Large v3", + "family": "whisper", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 0, + "output": 4096 + } + }, + { + "id": "nvidia/qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-06", + "last_updated": "2024-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/qwen/qwen2.5-coder-7b-instruct", + "name": "Qwen2.5 Coder 7b Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-17", + "last_updated": "2024-09-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/qwen/qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "nvidia/qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "nvidia/qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "nvidia/qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "nvidia/qwen/qwq-32b", + "name": "Qwq 32b", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "nvidia/z-ai/glm4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "nvidia/z-ai/glm5", + "name": "GLM5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 202752, + "output": 131000 + } + }, + { + "id": "ollama-cloud/cogito-2.1:671b", + "name": "cogito-2.1:671b", + "family": "cogito", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-11-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 163840, + "output": 32000 + } + }, + { + "id": "ollama-cloud/deepseek-v3.1:671b", + "name": "deepseek-v3.1:671b", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-08-21", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "ollama-cloud/deepseek-v3.2", + "name": "deepseek-v3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-06-15", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "ollama-cloud/devstral-2:123b", + "name": "devstral-2:123b", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-12-09", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "ollama-cloud/devstral-small-2:24b", + "name": "devstral-small-2:24b", + "family": "devstral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2025-12-09", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "ollama-cloud/gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "family": "gemini-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "ollama-cloud/gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "release_date": "2025-11-18", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 1048576, + "output": 64000 + } + }, + { + "id": "ollama-cloud/gemma3:12b", + "name": "gemma3:12b", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ollama-cloud/gemma3:27b", + "name": "gemma3:27b", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "release_date": "2025-07-27", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ollama-cloud/gemma3:4b", + "name": "gemma3:4b", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ollama-cloud/glm-4.6", + "name": "glm-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-09-29", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "ollama-cloud/glm-4.7", + "name": "glm-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-12-22", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "ollama-cloud/glm-5", + "name": "glm-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "ollama-cloud/gpt-oss:120b", + "name": "gpt-oss:120b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-08-05", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "ollama-cloud/gpt-oss:20b", + "name": "gpt-oss:20b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-08-05", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "ollama-cloud/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "ollama-cloud/kimi-k2.5", + "name": "kimi-k2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "ollama-cloud/kimi-k2:1t", + "name": "kimi-k2:1t", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "ollama-cloud/minimax-m2", + "name": "minimax-m2", + "family": "minimax", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-10-23", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 204800, + "output": 128000 + } + }, + { + "id": "ollama-cloud/minimax-m2.1", + "name": "minimax-m2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-12-23", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "ollama-cloud/minimax-m2.5", + "name": "minimax-m2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "ollama-cloud/ministral-3:14b", + "name": "ministral-3:14b", + "family": "ministral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 128000 + } + }, + { + "id": "ollama-cloud/ministral-3:3b", + "name": "ministral-3:3b", + "family": "ministral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2024-10-22", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 128000 + } + }, + { + "id": "ollama-cloud/ministral-3:8b", + "name": "ministral-3:8b", + "family": "ministral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 128000 + } + }, + { + "id": "ollama-cloud/mistral-large-3:675b", + "name": "mistral-large-3:675b", + "family": "mistral-large", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2025-12-02", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "ollama-cloud/nemotron-3-nano:30b", + "name": "nemotron-3-nano:30b", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-12-15", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 1048576, + "output": 131072 + } + }, + { + "id": "ollama-cloud/qwen3-coder-next", + "name": "qwen3-coder-next", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2026-02-02", + "last_updated": "2026-02-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "ollama-cloud/qwen3-coder:480b", + "name": "qwen3-coder:480b", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-07-22", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "ollama-cloud/qwen3-next:80b", + "name": "qwen3-next:80b", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-09-15", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "ollama-cloud/qwen3-vl:235b", + "name": "qwen3-vl:235b", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "release_date": "2025-09-22", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "ollama-cloud/qwen3-vl:235b-instruct", + "name": "qwen3-vl:235b-instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "release_date": "2025-09-22", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "ollama-cloud/qwen3.5:397b", + "name": "qwen3.5:397b", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 262144, + "output": 81920 + } + }, + { + "id": "ollama-cloud/rnj-1:8b", + "name": "rnj-1:8b", + "family": "rnj", + "attachment": false, + "reasoning": false, + "tool_call": true, + "release_date": "2025-12-06", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": {}, + "limit": { + "context": 32768, + "output": 4096 + } + }, + { + "id": "openai/codex-mini", + "name": "Codex Mini", + "family": "gpt-codex-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.5, + "output": 6.0, + "cache_read": 0.375 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + }, + "limit": { + "context": 16385, + "output": 4096 + } + }, + { + "id": "openai/gpt-4", + "name": "GPT-4", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 30.0, + "output": 60.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 30.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "openai/gpt-4o", + "name": "GPT-4o (2024-11-20)", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openai/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat (latest)", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "family": "gpt-codex", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 120.0 + }, + "limit": { + "context": 400000, + "output": 272000 + } + }, + { + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 21.0, + "output": 168.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openai/gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "family": "gpt-codex-spark", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "openai/o1", + "name": "o1", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o1-mini", + "name": "o1-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 128000, + "output": 65536 + } + }, + { + "id": "openai/o1-preview", + "name": "o1-preview", + "family": "o", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "openai/o1-pro", + "name": "o1-pro", + "family": "o-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 150.0, + "output": 600.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o3", + "name": "o3", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 10.0, + "output": 40.0, + "cache_read": 2.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o3-pro", + "name": "o3-pro", + "family": "o-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 20.0, + "output": 80.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o4-mini", + "name": "o4-mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openai/text-embedding-3-large", + "name": "text-embedding-3-large", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 3072 + } + }, + { + "id": "openai/text-embedding-3-small", + "name": "text-embedding-3-small", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 1536 + } + }, + { + "id": "openai/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2022-12", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "opencode/big-pickle", + "name": "Big Pickle", + "family": "big-pickle", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "opencode/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "opencode/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "opencode/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "opencode/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "opencode/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "opencode/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "opencode/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "opencode/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "opencode/gemini-3-flash", + "name": "Gemini 3 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "opencode/gemini-3-pro", + "name": "Gemini 3 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "opencode/gemini-3.1-pro", + "name": "Gemini 3.1 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "opencode/glm-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/glm-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/glm-4.7-free", + "name": "GLM-4.7 Free", + "family": "glm-free", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/glm-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/glm-5-free", + "name": "GLM-5 Free", + "family": "glm-free", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5-codex", + "name": "GPT-5 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "opencode/grok-code", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-20", + "last_updated": "2025-08-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "opencode/kimi-k2", + "name": "Kimi K2", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "opencode/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "opencode/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.08 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "opencode/kimi-k2.5-free", + "name": "Kimi K2.5 Free", + "family": "kimi-free", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "opencode/minimax-m2.1", + "name": "MiniMax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.1 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/minimax-m2.1-free", + "name": "MiniMax M2.1 Free", + "family": "minimax-free", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/minimax-m2.5", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/minimax-m2.5-free", + "name": "MiniMax M2.5 Free", + "family": "minimax-free", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0, + "cache_read": 0.0 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "opencode/qwen3-coder", + "name": "Qwen3 Coder", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.45, + "output": 1.8 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "opencode/trinity-large-preview-free", + "name": "Trinity Large Preview", + "family": "trinity", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/allenai/molmo-2-8b:free", + "name": "Molmo2 8B (free)", + "family": "allenai", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-09", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 36864, + "output": 36864 + } + }, + { + "id": "openrouter/anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "openrouter/anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "openrouter/anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "openrouter/anthropic/claude-opus-4", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "openrouter/anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "openrouter/anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05-30", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "openrouter/anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05-30", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "openrouter/anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "openrouter/anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "openrouter/anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "openrouter/arcee-ai/trinity-large-preview:free", + "name": "Trinity Large Preview", + "family": "trinity", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/arcee-ai/trinity-mini:free", + "name": "Trinity Mini", + "family": "trinity-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/black-forest-labs/flux.2-flex", + "name": "FLUX.2 Flex", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-11-25", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 67344, + "output": 67344 + } + }, + { + "id": "openrouter/black-forest-labs/flux.2-klein-4b", + "name": "FLUX.2 Klein 4B", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-14", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "openrouter/black-forest-labs/flux.2-max", + "name": "FLUX.2 Max", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-16", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 46864, + "output": 46864 + } + }, + { + "id": "openrouter/black-forest-labs/flux.2-pro", + "name": "FLUX.2 Pro", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-11-25", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 46864, + "output": 46864 + } + }, + { + "id": "openrouter/bytedance-seed/seedream-4.5", + "name": "Seedream 4.5", + "family": "seed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-23", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "openrouter/cognitivecomputations/dolphin-mistral-24b-venice-edition:free", + "name": "Uncensored (free)", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-07-09", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/cognitivecomputations/dolphin3.0-mistral-24b", + "name": "Dolphin3.0 Mistral 24B", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-02-13", + "last_updated": "2025-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/cognitivecomputations/dolphin3.0-r1-mistral-24b", + "name": "Dolphin3.0 R1 Mistral 24B", + "family": "mistral", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-02-13", + "last_updated": "2025-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/deepseek/deepseek-chat-v3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 16384, + "output": 8192 + } + }, + { + "id": "openrouter/deepseek/deepseek-chat-v3.1", + "name": "DeepSeek-V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/deepseek/deepseek-r1-0528-qwen3-8b:free", + "name": "Deepseek R1 0528 Qwen3 8B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-29", + "last_updated": "2025-05-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/deepseek/deepseek-r1-0528:free", + "name": "R1 0528 (free)", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openrouter/deepseek/deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-01-29", + "last_updated": "2025-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 64000, + "output": 8192 + } + }, + { + "id": "openrouter/deepseek/deepseek-r1:free", + "name": "R1 (free)", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/deepseek/deepseek-v3-base:free", + "name": "DeepSeek V3 Base (free)", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-03-29", + "last_updated": "2025-03-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "openrouter/deepseek/deepseek-v3.1-terminus:exacto", + "name": "DeepSeek V3.1 Terminus (exacto)", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "openrouter/deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 0.4 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "openrouter/deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek V3.2 Speciale", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.41 + }, + "limit": { + "context": 163840, + "output": 65536 + } + }, + { + "id": "openrouter/featherless/qwerky-72b", + "name": "Qwerky 72B", + "family": "qwerky", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/google/gemini-2.0-flash-001", + "name": "Gemini 2.0 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "openrouter/google/gemini-2.0-flash-exp:free", + "name": "Gemini 2.0 Flash Experimental (free)", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 1048576, + "output": 1048576 + } + }, + { + "id": "openrouter/google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-2.5-flash-lite-preview-09", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-2.5-flash-preview-09", + "name": "Gemini 2.5 Flash Preview 09-25", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.031 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0 + }, + "limit": { + "context": 1050000, + "output": 66000 + } + }, + { + "id": "openrouter/google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "openrouter/google/gemma-2-9b-it", + "name": "Gemma 2 9B", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-06-28", + "last_updated": "2024-06-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.09 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openrouter/google/gemma-3-12b-it", + "name": "Gemma 3 12B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.03, + "output": 0.1 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/google/gemma-3-12b-it:free", + "name": "Gemma 3 12B (free)", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.15 + }, + "limit": { + "context": 96000, + "output": 96000 + } + }, + { + "id": "openrouter/google/gemma-3-27b-it:free", + "name": "Gemma 3 27B (free)", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/google/gemma-3-4b-it", + "name": "Gemma 3 4B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.01703, + "output": 0.06815 + }, + "limit": { + "context": 96000, + "output": 96000 + } + }, + { + "id": "openrouter/google/gemma-3-4b-it:free", + "name": "Gemma 3 4B (free)", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/google/gemma-3n-e2b-it:free", + "name": "Gemma 3n 2B (free)", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2000 + } + }, + { + "id": "openrouter/google/gemma-3n-e4b-it", + "name": "Gemma 3n 4B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.04 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/google/gemma-3n-e4b-it:free", + "name": "Gemma 3n 4B (free)", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 2000 + } + }, + { + "id": "openrouter/kwaipilot/kat-coder-pro:free", + "name": "Kat Coder Pro (free)", + "family": "kat-coder", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-10", + "last_updated": "2025-11-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 65536 + } + }, + { + "id": "openrouter/liquid/lfm-2.5-1.2b-instruct:free", + "name": "LFM2.5-1.2B-Instruct (free)", + "family": "liquid", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-20", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/liquid/lfm-2.5-1.2b-thinking:free", + "name": "LFM2.5-1.2B-Thinking (free)", + "family": "liquid", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2026-01-20", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/meta-llama/llama-3.1-405b-instruct:free", + "name": "Llama 3.1 405B Instruct (free)", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-07-23", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/meta-llama/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/meta-llama/llama-3.2-3b-instruct:free", + "name": "Llama 3.2 3B Instruct (free)", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/meta-llama/llama-3.3-70b-instruct:free", + "name": "Llama 3.3 70B Instruct (free)", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/meta-llama/llama-4-scout:free", + "name": "Llama 4 Scout (free)", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 64000, + "output": 64000 + } + }, + { + "id": "openrouter/microsoft/mai-ds-r1:free", + "name": "MAI DS R1 (free)", + "family": "mai", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-21", + "last_updated": "2025-04-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/minimax/minimax-01", + "name": "MiniMax-01", + "family": "minimax", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.1 + }, + "limit": { + "context": 1000000, + "output": 1000000 + } + }, + { + "id": "openrouter/minimax/minimax-m1", + "name": "MiniMax M1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.2 + }, + "limit": { + "context": 1000000, + "output": 40000 + } + }, + { + "id": "openrouter/minimax/minimax-m2", + "name": "MiniMax M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-23", + "last_updated": "2025-10-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.28, + "output": 1.15, + "cache_read": 0.28, + "cache_write": 1.15 + }, + "limit": { + "context": 196600, + "output": 118000 + } + }, + { + "id": "openrouter/minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "openrouter/minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "openrouter/mistralai/codestral", + "name": "Codestral 2508", + "family": "codestral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "openrouter/mistralai/devstral", + "name": "Devstral 2 2512", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/mistralai/devstral-2512:free", + "name": "Devstral 2 2512 (free)", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-12", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/mistralai/devstral-medium", + "name": "Devstral Medium", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/mistralai/devstral-small", + "name": "Devstral Small 1.1", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/mistralai/devstral-small-2505:free", + "name": "Devstral Small 2505 (free)", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-21", + "last_updated": "2025-05-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/mistralai/mistral-7b-instruct:free", + "name": "Mistral 7B Instruct (free)", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/mistralai/mistral-medium-3", + "name": "Mistral Medium 3", + "family": "mistral-medium", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/mistralai/mistral-medium-3.1", + "name": "Mistral Medium 3.1", + "family": "mistral-medium", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/mistralai/mistral-nemo:free", + "name": "Mistral Nemo (free)", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-07-19", + "last_updated": "2024-07-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral Small 3.1 24B Instruct", + "family": "mistral-small", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "openrouter/mistralai/mistral-small-3.2-24b-instruct", + "name": "Mistral Small 3.2 24B Instruct", + "family": "mistral-small", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 96000, + "output": 8192 + } + }, + { + "id": "openrouter/mistralai/mistral-small-3.2-24b-instruct:free", + "name": "Mistral Small 3.2 24B (free)", + "family": "mistral-small", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 96000, + "output": 96000 + } + }, + { + "id": "openrouter/moonshotai/kimi-dev-72b:free", + "name": "Kimi Dev 72b (free)", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/moonshotai/kimi-k2", + "name": "Kimi K2 Instruct 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "openrouter/moonshotai/kimi-k2-0905:exacto", + "name": "Kimi K2 Instruct 0905 (exacto)", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5 + }, + "limit": { + "context": 262144, + "output": 16384 + } + }, + { + "id": "openrouter/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.0, + "cache_read": 0.1 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/moonshotai/kimi-k2:free", + "name": "Kimi K2 (free)", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32800, + "output": 32800 + } + }, + { + "id": "openrouter/nousresearch/deephermes-3-llama-3-8b-preview", + "name": "DeepHermes 3 Llama 3 8B Preview", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-02-28", + "last_updated": "2025-02-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/nousresearch/hermes-3-llama-3.1-405b:free", + "name": "Hermes 3 405B Instruct (free)", + "family": "hermes", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-08-16", + "last_updated": "2024-08-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/nousresearch/hermes-4-405b", + "name": "Hermes 4 405B", + "family": "hermes", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/nousresearch/hermes-4-70b", + "name": "Hermes 4 70B", + "family": "hermes", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.13, + "output": 0.4 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/nvidia/nemotron-3-nano-30b-a3b:free", + "name": "Nemotron 3 Nano 30B A3B (free)", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-12-14", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "openrouter/nvidia/nemotron-nano-12b-v2-vl:free", + "name": "Nemotron Nano 12B 2 VL (free)", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-10-28", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "openrouter/nvidia/nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.04, + "output": 0.16 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/nvidia/nemotron-nano-9b-v2:free", + "name": "Nemotron Nano 9B V2 (free)", + "family": "nemotron", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2025-09-05", + "last_updated": "2025-08-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openrouter/openai/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5-chat", + "name": "GPT-5 Chat (latest)", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5-codex", + "name": "GPT-5 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5-image", + "name": "GPT-5 Image", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-10-14", + "last_updated": "2025-10-14", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 10.0, + "cache_read": 1.25 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5-pro", + "name": "GPT-5 Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 120.0 + }, + "limit": { + "context": 400000, + "output": 272000 + } + }, + { + "id": "openrouter/openai/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openrouter/openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 100000 + } + }, + { + "id": "openrouter/openai/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "openrouter/openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 21.0, + "output": 168.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "openrouter/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.072, + "output": 0.28 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-oss-120b:exacto", + "name": "GPT OSS 120B (exacto)", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.24 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-oss-120b:free", + "name": "gpt-oss-120b (free)", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.2 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-oss-20b:free", + "name": "gpt-oss-20b (free)", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/openai/gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "openrouter/openai/o4-mini", + "name": "o4 Mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "openrouter/openrouter/aurora-alpha", + "name": "Aurora Alpha", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-09", + "last_updated": "2026-02-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 50000 + } + }, + { + "id": "openrouter/openrouter/sherlock-dash-alpha", + "name": "Sherlock Dash Alpha", + "family": "sherlock", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-15", + "last_updated": "2025-12-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 1840000, + "output": 0 + } + }, + { + "id": "openrouter/openrouter/sherlock-think-alpha", + "name": "Sherlock Think Alpha", + "family": "sherlock", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-15", + "last_updated": "2025-12-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 1840000, + "output": 0 + } + }, + { + "id": "openrouter/prime-intellect/intellect-3", + "name": "Intellect 3", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.1 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/qwen/qwen-2.5-vl-7b-instruct:free", + "name": "Qwen2.5-VL 7B Instruct (free)", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02", + "release_date": "2024-08-28", + "last_updated": "2024-08-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/qwen/qwen2.5-vl-32b-instruct:free", + "name": "Qwen2.5 VL 32B Instruct (free)", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openrouter/qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/qwen/qwen2.5-vl-72b-instruct:free", + "name": "Qwen2.5 VL 72B Instruct (free)", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/qwen/qwen3-14b:free", + "name": "Qwen3 14B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "openrouter/qwen/qwen3-235b-a22b-07-25", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.85 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "openrouter/qwen/qwen3-235b-a22b-07-25:free", + "name": "Qwen3 235B A22B Instruct 2507 (free)", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "openrouter/qwen/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.078, + "output": 0.312 + }, + "limit": { + "context": 262144, + "output": 81920 + } + }, + { + "id": "openrouter/qwen/qwen3-235b-a22b:free", + "name": "Qwen3 235B A22B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "openrouter/qwen/qwen3-30b-a3b-instruct", + "name": "Qwen3 30B A3B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "openrouter/qwen/qwen3-30b-a3b-thinking", + "name": "Qwen3 30B A3B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "openrouter/qwen/qwen3-30b-a3b:free", + "name": "Qwen3 30B A3B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "openrouter/qwen/qwen3-32b:free", + "name": "Qwen3 32B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "openrouter/qwen/qwen3-4b:free", + "name": "Qwen3 4B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-30", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "openrouter/qwen/qwen3-8b:free", + "name": "Qwen3 8B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 40960, + "output": 40960 + } + }, + { + "id": "openrouter/qwen/qwen3-coder", + "name": "Qwen3 Coder", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "openrouter/qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.27 + }, + "limit": { + "context": 160000, + "output": 65536 + } + }, + { + "id": "openrouter/qwen/qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.5 + }, + "limit": { + "context": 128000, + "output": 66536 + } + }, + { + "id": "openrouter/qwen/qwen3-coder:exacto", + "name": "Qwen3 Coder (exacto)", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.38, + "output": 1.53 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "openrouter/qwen/qwen3-coder:free", + "name": "Qwen3 Coder 480B A35B Instruct (free)", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "openrouter/qwen/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 6.0 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "openrouter/qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 1.4 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/qwen/qwen3-next-80b-a3b-instruct:free", + "name": "Qwen3 Next 80B A3B Instruct (free)", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 1.4 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "openrouter/qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "openrouter/qwen/qwen3.5-plus-02-15", + "name": "Qwen3.5 Plus 2026-02-15", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4 + }, + "limit": { + "context": 1000000, + "output": 65536 + } + }, + { + "id": "openrouter/qwen/qwq-32b:free", + "name": "QwQ 32B (free)", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/rekaai/reka-flash-3", + "name": "Reka Flash 3", + "family": "reka", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "openrouter/sarvamai/sarvam-m:free", + "name": "Sarvam-M (free)", + "family": "sarvam", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2025-05-25", + "last_updated": "2025-05-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/sourceful/riverflow-v2-fast-preview", + "name": "Riverflow V2 Fast Preview", + "family": "sourceful", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-08", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openrouter/sourceful/riverflow-v2-max-preview", + "name": "Riverflow V2 Max Preview", + "family": "sourceful", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-08", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openrouter/sourceful/riverflow-v2-standard-preview", + "name": "Riverflow V2 Standard Preview", + "family": "sourceful", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-12-08", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "openrouter/stepfun/step-3.5-flash", + "name": "Step 3.5 Flash", + "family": "step", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "openrouter/stepfun/step-3.5-flash:free", + "name": "Step 3.5 Flash (free)", + "family": "step", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "openrouter/thudm/glm-z1-32b:free", + "name": "GLM Z1 32B (free)", + "family": "glm-z", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "openrouter/tngtech/deepseek-r1t2-chimera:free", + "name": "DeepSeek R1T2 Chimera (free)", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/tngtech/tng-r1t-chimera:free", + "name": "R1T Chimera (free)", + "family": "tngtech", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11-26", + "last_updated": "2026-01-31", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "openrouter/x-ai/grok-3", + "name": "Grok 3", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75, + "cache_write": 15.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/x-ai/grok-3-beta", + "name": "Grok 3 Beta", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75, + "cache_write": 15.0 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/x-ai/grok-3-mini", + "name": "Grok 3 Mini", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075, + "cache_write": 0.5 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/x-ai/grok-3-mini-beta", + "name": "Grok 3 Mini Beta", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075, + "cache_write": 0.5 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "openrouter/x-ai/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75, + "cache_write": 15.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "openrouter/x-ai/grok-4-fast", + "name": "Grok 4 Fast", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "openrouter/x-ai/grok-4.1-fast", + "name": "Grok 4.1 Fast", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.05 + }, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "openrouter/x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 10000 + } + }, + { + "id": "openrouter/xiaomi/mimo-v2-flash", + "name": "MiMo-V2-Flash", + "family": "mimo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2025-12-14", + "last_updated": "2025-12-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "openrouter/z-ai/glm-4.5", + "name": "GLM 4.5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 128000, + "output": 96000 + } + }, + { + "id": "openrouter/z-ai/glm-4.5-air", + "name": "GLM 4.5 Air", + "family": "glm-air", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 1.1 + }, + "limit": { + "context": 128000, + "output": 96000 + } + }, + { + "id": "openrouter/z-ai/glm-4.5-air:free", + "name": "GLM 4.5 Air (free)", + "family": "glm-air", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 96000 + } + }, + { + "id": "openrouter/z-ai/glm-4.5v", + "name": "GLM 4.5V", + "family": "glm", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.8 + }, + "limit": { + "context": 64000, + "output": 16384 + } + }, + { + "id": "openrouter/z-ai/glm-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "openrouter/z-ai/glm-4.6:exacto", + "name": "GLM 4.6 (exacto)", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.9, + "cache_read": 0.11 + }, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "openrouter/z-ai/glm-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "openrouter/z-ai/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.4 + }, + "limit": { + "context": 200000, + "output": 65535 + } + }, + { + "id": "openrouter/z-ai/glm-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 + }, + "limit": { + "context": 202752, + "output": 131000 + } + }, + { + "id": "ovhcloud/deepseek-r1-distill-llama-70b", + "name": "DeepSeek-R1-Distill-Llama-70B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-30", + "last_updated": "2025-01-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.74, + "output": 0.74 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ovhcloud/gpt-oss-120b", + "name": "gpt-oss-120b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.47 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ovhcloud/gpt-oss-20b", + "name": "gpt-oss-20b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.18 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ovhcloud/llama-3.1-8b-instruct", + "name": "Llama-3.1-8B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-11", + "last_updated": "2025-06-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.11 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ovhcloud/meta-llama-3_3-70b-instruct", + "name": "Meta-Llama-3_3-70B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.74, + "output": 0.74 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ovhcloud/mistral-7b-instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.11, + "output": 0.11 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "ovhcloud/mistral-nemo-instruct", + "name": "Mistral-Nemo-Instruct-2407", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-20", + "last_updated": "2024-11-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 0.14 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "ovhcloud/mistral-small-3.2-24b-instruct", + "name": "Mistral-Small-3.2-24B-Instruct-2506", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.31 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "ovhcloud/mixtral-8x7b-instruct-v0.1", + "name": "Mixtral-8x7B-Instruct-v0.1", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 0.7 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "ovhcloud/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.96, + "output": 0.96 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "ovhcloud/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.01, + "output": 1.01 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "ovhcloud/qwen3-32b", + "name": "Qwen3-32B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.25 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "ovhcloud/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.26 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "perplexity/sonar", + "name": "Sonar", + "family": "sonar", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 1.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "perplexity/sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": false, + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "perplexity/sonar-pro", + "name": "Sonar Pro", + "family": "sonar-pro", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "family": "sonar-reasoning", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "poe/anthropic/claude-haiku-3", + "name": "Claude-Haiku-3", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-03-09", + "last_updated": "2024-03-09", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 1.1, + "cache_read": 0.021, + "cache_write": 0.26 + }, + "limit": { + "context": 189096, + "output": 8192 + } + }, + { + "id": "poe/anthropic/claude-haiku-3.5", + "name": "Claude-Haiku-3.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.68, + "output": 3.4, + "cache_read": 0.068, + "cache_write": 0.85 + }, + "limit": { + "context": 189096, + "output": 8192 + } + }, + { + "id": "poe/anthropic/claude-haiku-4.5", + "name": "Claude-Haiku-4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.85, + "output": 4.3, + "cache_read": 0.085, + "cache_write": 1.1 + }, + "limit": { + "context": 192000, + "output": 64000 + } + }, + { + "id": "poe/anthropic/claude-opus-4", + "name": "Claude-Opus-4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 13.0, + "output": 64.0, + "cache_read": 1.3, + "cache_write": 16.0 + }, + "limit": { + "context": 192512, + "output": 28672 + } + }, + { + "id": "poe/anthropic/claude-opus-4.1", + "name": "Claude-Opus-4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 13.0, + "output": 64.0, + "cache_read": 1.3, + "cache_write": 16.0 + }, + "limit": { + "context": 196608, + "output": 32000 + } + }, + { + "id": "poe/anthropic/claude-opus-4.5", + "name": "Claude-Opus-4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-21", + "last_updated": "2025-11-21", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 4.3, + "output": 21.0, + "cache_read": 0.43, + "cache_write": 5.3 + }, + "limit": { + "context": 196608, + "output": 64000 + } + }, + { + "id": "poe/anthropic/claude-opus-4.6", + "name": "Claude-Opus-4.6", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 4.3, + "output": 21.0, + "cache_read": 0.43, + "cache_write": 5.3 + }, + "limit": { + "context": 983040, + "output": 128000 + } + }, + { + "id": "poe/anthropic/claude-sonnet-3.5", + "name": "Claude-Sonnet-3.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-06-05", + "last_updated": "2024-06-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.6, + "output": 13.0, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "limit": { + "context": 189096, + "output": 8192 + } + }, + { + "id": "poe/anthropic/claude-sonnet-3.5-june", + "name": "Claude-Sonnet-3.5-June", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-11-18", + "last_updated": "2024-11-18", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.6, + "output": 13.0, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "limit": { + "context": 189096, + "output": 8192 + } + }, + { + "id": "poe/anthropic/claude-sonnet-3.7", + "name": "Claude-Sonnet-3.7", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.6, + "output": 13.0, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "limit": { + "context": 196608, + "output": 128000 + } + }, + { + "id": "poe/anthropic/claude-sonnet-4", + "name": "Claude-Sonnet-4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.6, + "output": 13.0, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "limit": { + "context": 983040, + "output": 64000 + } + }, + { + "id": "poe/anthropic/claude-sonnet-4.5", + "name": "Claude-Sonnet-4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.6, + "output": 13.0, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "limit": { + "context": 983040, + "output": 32768 + } + }, + { + "id": "poe/anthropic/claude-sonnet-4.6", + "name": "Claude-Sonnet-4.6", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.6, + "output": 13.0, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "limit": { + "context": 983040, + "output": 128000 + } + }, + { + "id": "poe/cerebras/gpt-oss-120b-cs", + "name": "gpt-oss-120b-cs", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/cerebras/llama-3.1-8b-cs", + "name": "llama-3.1-8b-cs", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-13", + "last_updated": "2025-05-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/cerebras/llama-3.3-70b-cs", + "name": "llama-3.3-70b-cs", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-05-13", + "last_updated": "2025-05-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/cerebras/qwen3-235b-2507-cs", + "name": "qwen3-235b-2507-cs", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/cerebras/qwen3-32b-cs", + "name": "qwen3-32b-cs", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-15", + "last_updated": "2025-05-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/elevenlabs/elevenlabs-music", + "name": "ElevenLabs-Music", + "family": "elevenlabs", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-29", + "last_updated": "2025-08-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000, + "output": 0 + } + }, + { + "id": "poe/elevenlabs/elevenlabs-v2.5-turbo", + "name": "ElevenLabs-v2.5-Turbo", + "family": "elevenlabs", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-10-28", + "last_updated": "2024-10-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 0 + } + }, + { + "id": "poe/elevenlabs/elevenlabs-v3", + "name": "ElevenLabs-v3", + "family": "elevenlabs", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 0 + } + }, + { + "id": "poe/google/gemini-2.0-flash", + "name": "Gemini-2.0-Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.42 + }, + "limit": { + "context": 990000, + "output": 8192 + } + }, + { + "id": "poe/google/gemini-2.0-flash-lite", + "name": "Gemini-2.0-Flash-Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.052, + "output": 0.21 + }, + "limit": { + "context": 990000, + "output": 8192 + } + }, + { + "id": "poe/google/gemini-2.5-flash", + "name": "Gemini-2.5-Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-26", + "last_updated": "2025-04-26", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 + }, + "limit": { + "context": 1065535, + "output": 65535 + } + }, + { + "id": "poe/google/gemini-2.5-flash-lite", + "name": "Gemini-2.5-Flash-Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-19", + "last_updated": "2025-06-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 1024000, + "output": 64000 + } + }, + { + "id": "poe/google/gemini-2.5-pro", + "name": "Gemini-2.5-Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.87, + "output": 7.0, + "cache_read": 0.087 + }, + "limit": { + "context": 1065535, + "output": 65535 + } + }, + { + "id": "poe/google/gemini-3-flash", + "name": "Gemini-3-Flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-07", + "last_updated": "2025-10-07", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4, + "cache_read": 0.04 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "poe/google/gemini-3-pro", + "name": "Gemini-3-Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "poe/google/gemini-deep-research", + "name": "gemini-deep-research", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.6, + "output": 9.6 + }, + "limit": { + "context": 1048576, + "output": 0 + } + }, + { + "id": "poe/google/imagen-3", + "name": "Imagen-3", + "family": "imagen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-10-15", + "last_updated": "2024-10-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/imagen-3-fast", + "name": "Imagen-3-Fast", + "family": "imagen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-10-17", + "last_updated": "2024-10-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/imagen-4", + "name": "Imagen-4", + "family": "imagen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/imagen-4-fast", + "name": "Imagen-4-Fast", + "family": "imagen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/imagen-4-ultra", + "name": "Imagen-4-Ultra", + "family": "imagen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/lyria", + "name": "Lyria", + "family": "lyria", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/google/nano-banana", + "name": "Nano-Banana", + "family": "nano-banana", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 + }, + "limit": { + "context": 65536, + "output": 0 + } + }, + { + "id": "poe/google/nano-banana-pro", + "name": "Nano-Banana-Pro", + "family": "nano-banana", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 65536, + "output": 0 + } + }, + { + "id": "poe/google/veo-2", + "name": "Veo-2", + "family": "veo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-12-02", + "last_updated": "2024-12-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/veo-3", + "name": "Veo-3", + "family": "veo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/veo-3-fast", + "name": "Veo-3-Fast", + "family": "veo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-13", + "last_updated": "2025-10-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/veo-3.1", + "name": "Veo-3.1", + "family": "veo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/google/veo-3.1-fast", + "name": "Veo-3.1-Fast", + "family": "veo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "poe/ideogramai/ideogram", + "name": "Ideogram", + "family": "ideogram", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-04-03", + "last_updated": "2024-04-03", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 150, + "output": 0 + } + }, + { + "id": "poe/ideogramai/ideogram-v2", + "name": "Ideogram-v2", + "family": "ideogram", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-08-21", + "last_updated": "2024-08-21", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 150, + "output": 0 + } + }, + { + "id": "poe/ideogramai/ideogram-v2a", + "name": "Ideogram-v2a", + "family": "ideogram", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 150, + "output": 0 + } + }, + { + "id": "poe/ideogramai/ideogram-v2a-turbo", + "name": "Ideogram-v2a-Turbo", + "family": "ideogram", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 150, + "output": 0 + } + }, + { + "id": "poe/lumalabs/ray2", + "name": "Ray2", + "family": "ray", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-02-20", + "last_updated": "2025-02-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 5000, + "output": 0 + } + }, + { + "id": "poe/novita/glm-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/novita/glm-4.6v", + "name": "glm-4.6v", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 131000, + "output": 32768 + } + }, + { + "id": "poe/novita/glm-4.7", + "name": "glm-4.7", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 205000, + "output": 131072 + } + }, + { + "id": "poe/novita/glm-4.7-flash", + "name": "glm-4.7-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 65500 + } + }, + { + "id": "poe/novita/glm-4.7-n", + "name": "glm-4.7-n", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 205000, + "output": 131072 + } + }, + { + "id": "poe/novita/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 0 + } + }, + { + "id": "poe/novita/kimi-k2.5", + "name": "kimi-k2.5", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 262144 + } + }, + { + "id": "poe/novita/minimax-m2.1", + "name": "minimax-m2.1", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-26", + "last_updated": "2025-12-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 205000, + "output": 131072 + } + }, + { + "id": "poe/openai/chatgpt-4o", + "name": "ChatGPT-4o-Latest", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-08-14", + "last_updated": "2024-08-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 4.5, + "output": 14.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "poe/openai/dall-e-3", + "name": "DALL-E-3", + "family": "dall-e", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2023-11-06", + "last_updated": "2023-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 800, + "output": 0 + } + }, + { + "id": "poe/openai/gpt-3.5-turbo", + "name": "GPT-3.5-Turbo", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.45, + "output": 1.4 + }, + "limit": { + "context": 16384, + "output": 2048 + } + }, + { + "id": "poe/openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5-Turbo-Instruct", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2023-09-20", + "last_updated": "2023-09-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.4, + "output": 1.8 + }, + "limit": { + "context": 3500, + "output": 1024 + } + }, + { + "id": "poe/openai/gpt-3.5-turbo-raw", + "name": "GPT-3.5-Turbo-Raw", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2023-09-27", + "last_updated": "2023-09-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.45, + "output": 1.4 + }, + "limit": { + "context": 4524, + "output": 2048 + } + }, + { + "id": "poe/openai/gpt-4-classic", + "name": "GPT-4-Classic-0314", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-08-26", + "last_updated": "2024-08-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 27.0, + "output": 54.0 + }, + "limit": { + "context": 8192, + "output": 4096 + } + }, + { + "id": "poe/openai/gpt-4-turbo", + "name": "GPT-4-Turbo", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 9.0, + "output": 27.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "poe/openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "poe/openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.36, + "output": 1.4, + "cache_read": 0.09 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "poe/openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.36, + "cache_read": 0.022 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "poe/openai/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "poe/openai/gpt-4o-aug", + "name": "GPT-4o-Aug", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-11-21", + "last_updated": "2024-11-21", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.2, + "output": 9.0, + "cache_read": 1.1 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "poe/openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.54, + "cache_read": 0.068 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "poe/openai/gpt-4o-mini-search", + "name": "GPT-4o-mini-Search", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.54 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "poe/openai/gpt-4o-search", + "name": "GPT-4o-Search", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.2, + "output": 9.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "poe/openai/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5-chat", + "name": "GPT-5-Chat", + "family": "gpt-codex", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "poe/openai/gpt-5-codex", + "name": "GPT-5-Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5-mini", + "name": "GPT-5-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5-nano", + "name": "GPT-5-nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.045, + "output": 0.36, + "cache_read": 0.0045 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5-pro", + "name": "GPT-5-Pro", + "family": "gpt-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 14.0, + "output": 110.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.1", + "name": "GPT-5.1", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.1-instant", + "name": "GPT-5.1-Instant", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 9.0, + "cache_read": 0.11 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "poe/openai/gpt-5.2", + "name": "GPT-5.2", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.6, + "output": 13.0, + "cache_read": 0.16 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.6, + "output": 13.0, + "cache_read": 0.16 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-5.2-instant", + "name": "GPT-5.2-Instant", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.6, + "output": 13.0, + "cache_read": 0.16 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "poe/openai/gpt-5.2-pro", + "name": "GPT-5.2-Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 19.0, + "output": 150.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "poe/openai/gpt-image-1", + "name": "GPT-Image-1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 0 + } + }, + { + "id": "poe/openai/gpt-image-1-mini", + "name": "GPT-Image-1-Mini", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/openai/gpt-image-1.5", + "name": "gpt-image-1.5", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 0 + } + }, + { + "id": "poe/openai/o1", + "name": "o1", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2024-12-18", + "last_updated": "2024-12-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 14.0, + "output": 54.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o1-pro", + "name": "o1-pro", + "family": "o-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-03-19", + "last_updated": "2025-03-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 140.0, + "output": 540.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o3", + "name": "o3", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o3-deep-research", + "name": "o3-deep-research", + "family": "o", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 9.0, + "output": 36.0, + "cache_read": 2.2 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.99, + "output": 4.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o3-mini-high", + "name": "o3-mini-high", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.99, + "output": 4.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o3-pro", + "name": "o3-pro", + "family": "o-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 18.0, + "output": 72.0 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o4-mini", + "name": "o4-mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.99, + "output": 4.0, + "cache_read": 0.25 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "poe/openai/sora-2", + "name": "Sora-2", + "family": "sora", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/openai/sora-2-pro", + "name": "Sora-2-Pro", + "family": "sora", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/poetools/claude-code", + "name": "claude-code", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-27", + "last_updated": "2025-11-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 0, + "output": 0 + } + }, + { + "id": "poe/runwayml/runway", + "name": "Runway", + "family": "runway", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-10-11", + "last_updated": "2024-10-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256, + "output": 0 + } + }, + { + "id": "poe/runwayml/runway-gen-4-turbo", + "name": "Runway-Gen-4-Turbo", + "family": "runway", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-05-09", + "last_updated": "2025-05-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256, + "output": 0 + } + }, + { + "id": "poe/stabilityai/stablediffusionxl", + "name": "StableDiffusionXL", + "family": "stable-diffusion", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2023-07-09", + "last_updated": "2023-07-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200, + "output": 0 + } + }, + { + "id": "poe/topazlabs-co/topazlabs", + "name": "TopazLabs", + "family": "topazlabs", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 204, + "output": 0 + } + }, + { + "id": "poe/trytako/tako", + "name": "Tako", + "family": "tako", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2048, + "output": 0 + } + }, + { + "id": "poe/xai/grok-3", + "name": "Grok 3", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "poe/xai/grok-3-mini", + "name": "Grok 3 Mini", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "poe/xai/grok-4", + "name": "Grok-4", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 + }, + "limit": { + "context": 256000, + "output": 128000 + } + }, + { + "id": "poe/xai/grok-4-fast", + "name": "Grok-4-Fast-Reasoning", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-09-16", + "last_updated": "2025-09-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 128000 + } + }, + { + "id": "poe/xai/grok-4-fast-non", + "name": "Grok-4-Fast-Non-Reasoning", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-09-16", + "last_updated": "2025-09-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "limit": { + "context": 2000000, + "output": 128000 + } + }, + { + "id": "poe/xai/grok-4.1-fast", + "name": "Grok-4.1-Fast-Reasoning", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "poe/xai/grok-4.1-fast-non", + "name": "Grok-4.1-Fast-Non-Reasoning", + "family": "grok", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000000, + "output": 30000 + } + }, + { + "id": "poe/xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "limit": { + "context": 256000, + "output": 128000 + } + }, + { + "id": "privatemode-ai/gemma-3-27b", + "name": "Gemma 3 27B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "privatemode-ai/gpt-oss-120b", + "name": "gpt-oss-120b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "privatemode-ai/qwen3-coder-30b-a3b", + "name": "Qwen3-Coder 30B-A3B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "privatemode-ai/qwen3-embedding-4b", + "name": "Qwen3-Embedding 4B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-06-06", + "last_updated": "2025-06-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32000, + "output": 2560 + } + }, + { + "id": "privatemode-ai/whisper-large-v3", + "name": "Whisper large-v3", + "family": "whisper", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2023-09-01", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 0, + "output": 4096 + } + }, + { + "id": "qihang-ai/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.71 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "qihang-ai/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.71, + "output": 3.57 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "qihang-ai/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.43, + "output": 2.14 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "qihang-ai/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.71 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "qihang-ai/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.43 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "qihang-ai/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.57, + "output": 3.43 + }, + "limit": { + "context": 1000000, + "output": 65000 + } + }, + { + "id": "qihang-ai/gpt-5-mini", + "name": "GPT-5-Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.04, + "output": 0.29 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "qihang-ai/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "qihang-ai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 1.14 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "qiniu-ai/MiniMax-M1", + "name": "MiniMax M1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1000000, + "output": 80000 + } + }, + { + "id": "qiniu-ai/claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "qiniu-ai/claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-09", + "last_updated": "2025-09-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 8200 + } + }, + { + "id": "qiniu-ai/claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "qiniu-ai/claude-4.0-opus", + "name": "Claude 4.0 Opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/claude-4.0-sonnet", + "name": "Claude 4.0 Sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "qiniu-ai/claude-4.1-opus", + "name": "Claude 4.1 Opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/claude-4.5-haiku", + "name": "Claude 4.5 Haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "qiniu-ai/claude-4.5-opus", + "name": "Claude 4.5 Opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "qiniu-ai/claude-4.5-sonnet", + "name": "Claude 4.5 Sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "qiniu-ai/deepseek-r1", + "name": "DeepSeek-R1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/deepseek-v3", + "name": "DeepSeek-V3-0324", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 16000 + } + }, + { + "id": "qiniu-ai/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/deepseek/deepseek-math-v2", + "name": "Deepseek/Deepseek-Math-V2", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-12-04", + "last_updated": "2025-12-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 160000, + "output": 160000 + } + }, + { + "id": "qiniu-ai/deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek/DeepSeek-V3.1-Terminus", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/deepseek/deepseek-v3.1-terminus-thinking", + "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/deepseek/deepseek-v3.2-251201", + "name": "Deepseek/DeepSeek-V3.2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/deepseek/deepseek-v3.2-exp", + "name": "DeepSeek/DeepSeek-V3.2-Exp", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/deepseek/deepseek-v3.2-exp-thinking", + "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 12000 + } + }, + { + "id": "qiniu-ai/doubao-1.5-thinking-pro", + "name": "Doubao 1.5 Thinking Pro", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 16000 + } + }, + { + "id": "qiniu-ai/doubao-1.5-vision-pro", + "name": "Doubao 1.5 Vision Pro", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 16000 + } + }, + { + "id": "qiniu-ai/doubao-seed-1.6", + "name": "Doubao-Seed 1.6", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/doubao-seed-1.6-flash", + "name": "Doubao-Seed 1.6 Flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/doubao-seed-1.6-thinking", + "name": "Doubao-Seed 1.6 Thinking", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", + "modalities": { + "input": [ + "image", + "text", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "qiniu-ai/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "qiniu-ai/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1048576, + "output": 64000 + } + }, + { + "id": "qiniu-ai/gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "qiniu-ai/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1048576, + "output": 64000 + } + }, + { + "id": "qiniu-ai/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "qiniu-ai/gemini-3.0-flash-preview", + "name": "Gemini 3.0 Flash Preview", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "qiniu-ai/gemini-3.0-pro-image-preview", + "name": "Gemini 3.0 Pro Image Preview", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "qiniu-ai/gemini-3.0-pro-preview", + "name": "Gemini 3.0 Pro Preview", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "modalities": { + "input": [ + "text", + "image", + "video", + "pdf", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "qiniu-ai/glm-4.5", + "name": "GLM 4.5", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 131072, + "output": 98304 + } + }, + { + "id": "qiniu-ai/glm-4.5-air", + "name": "GLM 4.5 Air", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 131000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/gpt-oss-120b", + "name": "gpt-oss-120b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/gpt-oss-20b", + "name": "gpt-oss-20b", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/kimi-k2", + "name": "Kimi K2", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "qiniu-ai/kling-v2-6", + "name": "Kling-V2 6", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-13", + "last_updated": "2026-01-13", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "video" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 99999999, + "output": 99999999 + } + }, + { + "id": "qiniu-ai/meituan/longcat-flash-chat", + "name": "Meituan/Longcat-Flash-Chat", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-11-05", + "last_updated": "2025-11-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "qiniu-ai/mimo-v2-flash", + "name": "Mimo-V2-Flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "qiniu-ai/minimax/minimax-m2", + "name": "Minimax/Minimax-M2", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 128000 + } + }, + { + "id": "qiniu-ai/minimax/minimax-m2.1", + "name": "Minimax/Minimax-M2.1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 204800, + "output": 128000 + } + }, + { + "id": "qiniu-ai/moonshotai/kimi-k2", + "name": "Kimi K2 0905", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-08", + "last_updated": "2025-09-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 100000 + } + }, + { + "id": "qiniu-ai/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 100000 + } + }, + { + "id": "qiniu-ai/openai/gpt-5", + "name": "OpenAI/GPT-5", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "qiniu-ai/openai/gpt-5.2", + "name": "OpenAI/GPT-5.2", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "qiniu-ai/qwen-max", + "name": "Qwen2.5-Max-2025-01-25", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen-turbo", + "name": "Qwen-Turbo", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 1000000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen-vl-max", + "name": "Qwen VL-MAX-2025-01-25", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen2.5-vl-72b-instruct", + "name": "Qwen 2.5 VL 72B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "qiniu-ai/qwen2.5-vl-7b-instruct", + "name": "Qwen 2.5 VL 7B Instruct", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "qiniu-ai/qwen3-235b-a22b", + "name": "Qwen 3 235B A22B", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "qiniu-ai/qwen3-235b-a22b-instruct", + "name": "Qwen3 235b A22B Instruct 2507", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 262144, + "output": 64000 + } + }, + { + "id": "qiniu-ai/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 262144, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 40000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen3-32b", + "name": "Qwen3 32B", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 40000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-14", + "last_updated": "2025-08-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 262000, + "output": 4096 + } + }, + { + "id": "qiniu-ai/qwen3-max", + "name": "Qwen3 Max", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "qiniu-ai/qwen3-max-preview", + "name": "Qwen3 Max Preview", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-06", + "last_updated": "2025-09-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "qiniu-ai/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "qiniu-ai/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "qiniu-ai/stepfun-ai/gelab-zero-4b-preview", + "name": "Stepfun-Ai/Gelab Zero 4b Preview", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 8192, + "output": 4096 + } + }, + { + "id": "qiniu-ai/x-ai/grok-4-fast", + "name": "x-AI/Grok-4-Fast", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-20", + "last_updated": "2025-09-20", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "qiniu-ai/x-ai/grok-4-fast-non", + "name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "qiniu-ai/x-ai/grok-4.1-fast", + "name": "x-AI/Grok-4.1-Fast", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "qiniu-ai/x-ai/grok-4.1-fast-non", + "name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 2000000, + "output": 2000000 + } + }, + { + "id": "qiniu-ai/x-ai/grok-code-fast-1", + "name": "x-AI/Grok-Code-Fast 1", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-02", + "last_updated": "2025-09-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 10000 + } + }, + { + "id": "qiniu-ai/z-ai/autoglm-phone-9b", + "name": "Z-Ai/Autoglm Phone 9b", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 12800, + "output": 4096 + } + }, + { + "id": "qiniu-ai/z-ai/glm-4.6", + "name": "Z-AI/GLM 4.6", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "qiniu-ai/z-ai/glm-4.7", + "name": "Z-Ai/GLM 4.7", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "requesty/anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "requesty/anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 62000 + } + }, + { + "id": "requesty/anthropic/claude-opus-4", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "requesty/anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "requesty/anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "requesty/anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "requesty/anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "requesty/google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.55 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "requesty/google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31, + "cache_write": 2.375 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "requesty/google/gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05, + "cache_write": 1.0 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "requesty/google/gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2, + "cache_write": 4.5 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "requesty/openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "requesty/openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "limit": { + "context": 1047576, + "output": 32768 + } + }, + { + "id": "requesty/openai/gpt-4o-mini", + "name": "GPT-4o Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "requesty/openai/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "audio", + "image", + "video" + ], + "output": [ + "text", + "audio", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "requesty/openai/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "requesty/openai/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 16000, + "output": 4000 + } + }, + { + "id": "requesty/openai/o4-mini", + "name": "o4 Mini", + "family": "o-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "limit": { + "context": 200000, + "output": 100000 + } + }, + { + "id": "requesty/xai/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-09", + "last_updated": "2025-09-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.75, + "cache_write": 3.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "requesty/xai/grok-4-fast", + "name": "Grok 4 Fast", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.2 + }, + "limit": { + "context": 2000000, + "output": 64000 + } + }, + { + "id": "sap-ai-core/anthropic--claude-3-haiku", + "name": "anthropic--claude-3-haiku", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "sap-ai-core/anthropic--claude-3-opus", + "name": "anthropic--claude-3-opus", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "sap-ai-core/anthropic--claude-3-sonnet", + "name": "anthropic--claude-3-sonnet", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "sap-ai-core/anthropic--claude-3.5-sonnet", + "name": "anthropic--claude-3.5-sonnet", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "sap-ai-core/anthropic--claude-3.7-sonnet", + "name": "anthropic--claude-3.7-sonnet", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-31", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "sap-ai-core/anthropic--claude-4-opus", + "name": "anthropic--claude-4-opus", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "sap-ai-core/anthropic--claude-4-sonnet", + "name": "anthropic--claude-4-sonnet", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "sap-ai-core/anthropic--claude-4.5-haiku", + "name": "anthropic--claude-4.5-haiku", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "sap-ai-core/anthropic--claude-4.5-opus", + "name": "anthropic--claude-4.5-opus", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04-30", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "sap-ai-core/anthropic--claude-4.5-sonnet", + "name": "anthropic--claude-4.5-sonnet", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "sap-ai-core/gemini-2.5-flash", + "name": "gemini-2.5-flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "sap-ai-core/gemini-2.5-pro", + "name": "gemini-2.5-pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "sap-ai-core/gpt-5", + "name": "gpt-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "sap-ai-core/gpt-5-mini", + "name": "gpt-5-mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "sap-ai-core/gpt-5-nano", + "name": "gpt-5-nano", + "family": "gpt-nano", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 400000, + "output": 128000 + } + }, + { + "id": "scaleway/bge-multilingual-gemma2", + "name": "BGE Multilingual Gemma2", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-07-26", + "last_updated": "2025-06-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.0 + }, + "limit": { + "context": 8191, + "output": 3072 + } + }, + { + "id": "scaleway/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.9, + "output": 0.9 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "scaleway/devstral-2-123b-instruct", + "name": "Devstral 2 123B Instruct (2512)", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-07", + "last_updated": "2026-01-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 256000, + "output": 8192 + } + }, + { + "id": "scaleway/gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "family": "gemma", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 0.5 + }, + "limit": { + "context": 40000, + "output": 8192 + } + }, + { + "id": "scaleway/gpt-oss-120b", + "name": "GPT-OSS 120B", + "family": "gpt-oss", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "scaleway/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 16384 + } + }, + { + "id": "scaleway/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.9, + "output": 0.9 + }, + "limit": { + "context": 100000, + "output": 4096 + } + }, + { + "id": "scaleway/mistral-nemo-instruct", + "name": "Mistral Nemo Instruct 2407", + "family": "mistral-nemo", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-25", + "last_updated": "2024-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "scaleway/mistral-small-3.2-24b-instruct", + "name": "Mistral Small 3.2 24B Instruct (2506)", + "family": "mistral-small", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.35 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "scaleway/pixtral-12b", + "name": "Pixtral 12B 2409", + "family": "pixtral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "scaleway/qwen3-235b-a22b-instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 2.25 + }, + "limit": { + "context": 260000, + "output": 8192 + } + }, + { + "id": "scaleway/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "scaleway/voxtral-small-24b", + "name": "Voxtral Small 24B 2507", + "family": "voxtral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.35 + }, + "limit": { + "context": 32000, + "output": 8192 + } + }, + { + "id": "scaleway/whisper-large-v3", + "name": "Whisper Large v3", + "family": "whisper", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.003, + "output": 0.0 + }, + "limit": { + "context": 0, + "output": 4096 + } + }, + { + "id": "siliconflow-cn/ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "family": "seed", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 0.57 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Kwaipilot/KAT-Dev", + "name": "Kwaipilot/KAT-Dev", + "family": "kat-coder", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-27", + "last_updated": "2026-01-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "siliconflow-cn/PaddlePaddle/PaddleOCR-VL", + "name": "PaddlePaddle/PaddleOCR-VL", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "siliconflow-cn/PaddlePaddle/PaddleOCR-VL-1.5", + "name": "PaddlePaddle/PaddleOCR-VL-1.5", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 16384, + "output": 16384 + } + }, + { + "id": "siliconflow-cn/Pro/MiniMaxAI/MiniMax-M2.1", + "name": "Pro/MiniMaxAI/MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 197000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Pro/MiniMaxAI/MiniMax-M2.5", + "name": "Pro/MiniMaxAI/MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.22 + }, + "limit": { + "context": 192000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Pro/deepseek-ai/DeepSeek-R1", + "name": "Pro/deepseek-ai/DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.18 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/Pro/deepseek-ai/DeepSeek-V3", + "name": "Pro/deepseek-ai/DeepSeek-V3", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/Pro/deepseek-ai/DeepSeek-V3.2", + "name": "Pro/deepseek-ai/DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.42 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/Pro/moonshotai/Kimi-K2-Instruct", + "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Pro/moonshotai/Kimi-K2-Thinking", + "name": "Pro/moonshotai/Kimi-K2-Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.55, + "output": 2.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Pro/moonshotai/Kimi-K2.5", + "name": "Pro/moonshotai/Kimi-K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.55, + "output": 3.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Pro/zai-org/GLM-4.7", + "name": "Pro/zai-org/GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 205000, + "output": 205000 + } + }, + { + "id": "siliconflow-cn/Pro/zai-org/GLM-5", + "name": "Pro/zai-org/GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 3.2 + }, + "limit": { + "context": 205000, + "output": 205000 + } + }, + { + "id": "siliconflow-cn/Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-06", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.58 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-19", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.59 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.59 + }, + "limit": { + "context": 131000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.05 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.27 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.59 + }, + "limit": { + "context": 131000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-30B-A3B-Instruct", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.3 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-30B-A3B-Thinking", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.3 + }, + "limit": { + "context": 262000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.06, + "output": 0.06 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-01", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 1.4 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.45, + "output": 3.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-05", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 1.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-11", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 1.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.68 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 2.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/THUDM/GLM-4-32B", + "name": "THUDM/GLM-4-32B-0414", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.27 + }, + "limit": { + "context": 33000, + "output": 33000 + } + }, + { + "id": "siliconflow-cn/THUDM/GLM-4-9B", + "name": "THUDM/GLM-4-9B-0414", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.086, + "output": 0.086 + }, + "limit": { + "context": 33000, + "output": 33000 + } + }, + { + "id": "siliconflow-cn/THUDM/GLM-Z1-32B", + "name": "THUDM/GLM-Z1-32B-0414", + "family": "glm-z", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/THUDM/GLM-Z1-9B", + "name": "THUDM/GLM-Z1-9B-0414", + "family": "glm-z", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.086, + "output": 0.086 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/ascend-tribe/pangu-pro-moe", + "name": "ascend-tribe/pangu-pro-moe", + "family": "pangu", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "release_date": "2025-07-02", + "last_updated": "2026-01-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "siliconflow-cn/baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "family": "ernie", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-02", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 1.1 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-OCR", + "name": "deepseek-ai/DeepSeek-OCR", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-10-20", + "last_updated": "2025-10-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 8192 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.18 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.42 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow-cn/deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "family": "deepseek", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 4000, + "output": 4000 + } + }, + { + "id": "siliconflow-cn/inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "family": "ling", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "family": "ling", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "family": "ring", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/moonshotai/Kimi-K2-Instruct", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.55, + "output": 2.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "family": "step", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow-cn/tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "family": "hunyuan", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "family": "hunyuan", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 33000, + "output": 33000 + } + }, + { + "id": "siliconflow-cn/zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "family": "glm-air", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.86 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow-cn/zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "family": "glm", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.86 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow-cn/zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.9 + }, + "limit": { + "context": 205000, + "output": 205000 + } + }, + { + "id": "siliconflow-cn/zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "family": "glm", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-07", + "last_updated": "2025-12-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "family": "seed", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.21, + "output": 0.57 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/MiniMaxAI/MiniMax-M2.1", + "name": "MiniMaxAI/MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 197000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-06", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.58 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-19", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.59 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.59 + }, + "limit": { + "context": 131000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.05 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-03-24", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.27 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.59, + "output": 0.59 + }, + "limit": { + "context": 131000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Qwen/Qwen2.5-VL-7B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.05 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.35, + "output": 1.42 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-30B-A3B-Instruct", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.3 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-30B-A3B-Thinking", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.09, + "output": 0.3 + }, + "limit": { + "context": 262000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.06, + "output": 0.06 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-01", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 1.4 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-25", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.45, + "output": 3.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-05", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 1.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-11", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.29, + "output": 1.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 1.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.68 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 2.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/THUDM/GLM-4-32B", + "name": "THUDM/GLM-4-32B-0414", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.27 + }, + "limit": { + "context": 33000, + "output": 33000 + } + }, + { + "id": "siliconflow/THUDM/GLM-4-9B", + "name": "THUDM/GLM-4-9B-0414", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.086, + "output": 0.086 + }, + "limit": { + "context": 33000, + "output": 33000 + } + }, + { + "id": "siliconflow/THUDM/GLM-Z1-32B", + "name": "THUDM/GLM-Z1-32B-0414", + "family": "glm-z", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/THUDM/GLM-Z1-9B", + "name": "THUDM/GLM-Z1-9B-0414", + "family": "glm-z", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.086, + "output": 0.086 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "family": "ernie", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-02", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 1.1 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.18 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.18, + "output": 0.18 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-V3.1", + "name": "deepseek-ai/DeepSeek-V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-25", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.42 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow/deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-10", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.41 + }, + "limit": { + "context": 164000, + "output": 164000 + } + }, + { + "id": "siliconflow/deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "family": "deepseek", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 4000, + "output": 4000 + } + }, + { + "id": "siliconflow/inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "family": "ling", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "family": "ling", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.28 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "family": "ring", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-04-23", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.06, + "output": 0.06 + }, + "limit": { + "context": 33000, + "output": 4000 + } + }, + { + "id": "siliconflow/moonshotai/Kimi-K2-Instruct", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.55, + "output": 2.5 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/moonshotai/Kimi-K2.5", + "name": "moonshotai/Kimi-K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.55, + "output": 3.0 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/nex-agi/DeepSeek-V3.1-Nex-N1", + "name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.0 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/openai/gpt-oss-120b", + "name": "openai/gpt-oss-120b", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.45 + }, + "limit": { + "context": 131000, + "output": 8000 + } + }, + { + "id": "siliconflow/openai/gpt-oss-20b", + "name": "openai/gpt-oss-20b", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.04, + "output": 0.18 + }, + "limit": { + "context": 131000, + "output": 8000 + } + }, + { + "id": "siliconflow/stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "family": "step", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 262000, + "output": 262000 + } + }, + { + "id": "siliconflow/tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "family": "hunyuan", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.57 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "family": "hunyuan", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 33000, + "output": 33000 + } + }, + { + "id": "siliconflow/zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.0 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "family": "glm-air", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.86 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "family": "glm", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.14, + "output": 0.86 + }, + "limit": { + "context": 66000, + "output": 66000 + } + }, + { + "id": "siliconflow/zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.9 + }, + "limit": { + "context": 205000, + "output": 205000 + } + }, + { + "id": "siliconflow/zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "family": "glm", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-07", + "last_updated": "2025-12-07", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "siliconflow/zai-org/GLM-4.7", + "name": "zai-org/GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 205000, + "output": 205000 + } + }, + { + "id": "siliconflow/zai-org/GLM-5", + "name": "zai-org/GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 3.2 + }, + "limit": { + "context": 205000, + "output": 205000 + } + }, + { + "id": "stackit/Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", + "name": "Qwen3-VL 235B", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.64, + "output": 1.91 + }, + "limit": { + "context": 218000, + "output": 8192 + } + }, + { + "id": "stackit/Qwen/Qwen3-VL-Embedding-8B", + "name": "Qwen3-VL Embedding 8B", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 0.09 + }, + "limit": { + "context": 32000, + "output": 4096 + } + }, + { + "id": "stackit/cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", + "name": "Llama 3.3 70B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.49, + "output": 0.71 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "stackit/google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2025-05-17", + "last_updated": "2025-05-17", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.49, + "output": 0.71 + }, + "limit": { + "context": 37000, + "output": 8192 + } + }, + { + "id": "stackit/intfloat/e5-mistral-7b-instruct", + "name": "E5 Mistral 7B", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.02, + "output": 0.02 + }, + "limit": { + "context": 4096, + "output": 4096 + } + }, + { + "id": "stackit/neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", + "name": "Llama 3.1 8B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.16, + "output": 0.27 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "stackit/neuralmagic/Mistral-Nemo-Instruct-2407-FP8", + "name": "Mistral Nemo", + "family": "mistral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.49, + "output": 0.71 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "stackit/openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "family": "gpt", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.49, + "output": 0.71 + }, + "limit": { + "context": 131000, + "output": 8192 + } + }, + { + "id": "stepfun/step-1-32k", + "name": "Step 1 (32K)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.05, + "output": 9.59, + "cache_read": 0.41 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "stepfun/step-2-16k", + "name": "Step 2 (16K)", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.21, + "output": 16.44, + "cache_read": 1.04 + }, + "limit": { + "context": 16384, + "output": 8192 + } + }, + { + "id": "stepfun/step-3.5-flash", + "name": "Step 3.5 Flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "submodel/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.3 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "submodel/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 131072 + } + }, + { + "id": "submodel/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "submodel/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1 0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 2.15 + }, + "limit": { + "context": 75000, + "output": 163840 + } + }, + { + "id": "submodel/deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 75000, + "output": 163840 + } + }, + { + "id": "submodel/deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 75000, + "output": 163840 + } + }, + { + "id": "submodel/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.5 + }, + "limit": { + "context": 131072, + "output": 32768 + } + }, + { + "id": "submodel/zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "family": "glm-air", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.5 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "submodel/zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.8 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "synthetic/hf:MiniMaxAI/MiniMax-M2", + "name": "MiniMax-M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 196608, + "output": 131000 + } + }, + { + "id": "synthetic/hf:MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "synthetic/hf:Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.8, + "output": 0.8 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "synthetic/hf:Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen 3 235B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "synthetic/hf:Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.65, + "output": 3.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "synthetic/hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen 3 Coder 480B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 2.0 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "synthetic/hf:deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1 (0528)", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 8.0 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "synthetic/hf:deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3 (0324)", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 1.2 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "synthetic/hf:deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.56, + "output": 1.68 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "synthetic/hf:deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 1.2 + }, + "limit": { + "context": 128000, + "output": 128000 + } + }, + { + "id": "synthetic/hf:deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 0.4, + "cache_read": 0.27, + "cache_write": 0.0 + }, + "limit": { + "context": 162816, + "output": 8000 + } + }, + { + "id": "synthetic/hf:meta-llama/Llama-3.1-405B-Instruct", + "name": "Llama-3.1-405B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 3.0, + "output": 3.0 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "synthetic/hf:meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama-3.1-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.9, + "output": 0.9 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "synthetic/hf:meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "synthetic/hf:meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.9, + "output": 0.9 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "synthetic/hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.22, + "output": 0.88 + }, + "limit": { + "context": 524000, + "output": 4096 + } + }, + { + "id": "synthetic/hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama-4-Scout-17B-16E-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 328000, + "output": 4096 + } + }, + { + "id": "synthetic/hf:moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2 0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.2, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "synthetic/hf:moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "synthetic/hf:moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "synthetic/hf:nvidia/Kimi-K2.5-NVFP4", + "name": "Kimi K2.5 (NVFP4)", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 262144, + "output": 65536 + } + }, + { + "id": "synthetic/hf:openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "synthetic/hf:zai-org/GLM-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "synthetic/hf:zai-org/GLM-4.7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.19 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "togetherai/MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 1.2 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "togetherai/Qwen/Qwen3-235B-A22B-Instruct-2507-tput", + "name": "Qwen3 235B A22B Instruct 2507 FP8", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 2.0, + "output": 2.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/Qwen/Qwen3-Coder-Next-FP8", + "name": "Qwen3 Coder Next FP8", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2026-02-03", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 1.2 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5 397B A17B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 3.6 + }, + "limit": { + "context": 262144, + "output": 130000 + } + }, + { + "id": "togetherai/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 3.0, + "output": 7.0 + }, + "limit": { + "context": 163839, + "output": 163839 + } + }, + { + "id": "togetherai/deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.25, + "output": 1.25 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "togetherai/deepseek-ai/DeepSeek-V3-1", + "name": "DeepSeek V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.7 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "togetherai/essentialai/Rnj-1-Instruct", + "name": "Rnj-1 Instruct", + "family": "rnj", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "togetherai/meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.88, + "output": 0.88 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "togetherai/moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2 Instruct-0905", + "family": "kimi", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.2, + "output": 4.0 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 2.8 + }, + "limit": { + "context": 262144, + "output": 262144 + } + }, + { + "id": "togetherai/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "togetherai/zai-org/GLM-4.6", + "name": "GLM 4.6", + "family": "glm", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 2.2 + }, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "togetherai/zai-org/GLM-4.7", + "name": "GLM-4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.45, + "output": 2.0 + }, + "limit": { + "context": 200000, + "output": 200000 + } + }, + { + "id": "togetherai/zai-org/GLM-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-11", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "upstage/solar-mini", + "name": "solar-mini", + "family": "solar-mini", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-06-12", + "last_updated": "2025-04-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 32768, + "output": 4096 + } + }, + { + "id": "upstage/solar-pro2", + "name": "solar-pro2", + "family": "solar-pro", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 0.25 + }, + "limit": { + "context": 65536, + "output": 8192 + } + }, + { + "id": "upstage/solar-pro3", + "name": "solar-pro3", + "family": "solar-pro", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2026-01", + "last_updated": "2026-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 0.25 + }, + "limit": { + "context": 131072, + "output": 8192 + } + }, + { + "id": "v0/v0-1.0-md", + "name": "v0-1.0-md", + "family": "v0", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "v0/v0-1.5-lg", + "name": "v0-1.5-lg", + "family": "v0", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0 + }, + "limit": { + "context": 512000, + "output": 32000 + } + }, + { + "id": "v0/v0-1.5-md", + "name": "v0-1.5-md", + "family": "v0", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-05", + "last_updated": "2026-02-18", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 6.0, + "output": 30.0, + "cache_read": 0.6, + "cache_write": 7.5 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "venice/claude-opus-45", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-12-06", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 6.0, + "output": 30.0, + "cache_read": 0.6, + "cache_write": 7.5 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "venice/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.75, + "output": 18.75, + "cache_read": 0.375, + "cache_write": 4.69 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "venice/claude-sonnet-45", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-01-15", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.75, + "output": 18.75, + "cache_read": 0.375, + "cache_write": 4.69 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "venice/deepseek-v3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2025-10", + "release_date": "2025-12-04", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.0, + "cache_read": 0.2 + }, + "limit": { + "context": 160000, + "output": 40000 + } + }, + { + "id": "venice/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-12-19", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.7, + "output": 3.75, + "cache_read": 0.07 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-12-02", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 15.0, + "cache_read": 0.625 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "venice/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 15.0, + "cache_read": 0.5, + "cache_write": 0.5 + }, + "limit": { + "context": 1000000, + "output": 250000 + } + }, + { + "id": "venice/google-gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "family": "gemma", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11-04", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.12, + "output": 0.2 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "venice/grok-41-fast", + "name": "Grok 4.1 Fast", + "family": "grok", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-12-01", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.25, + "cache_read": 0.125 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.87, + "cache_read": 0.03 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/hermes-3-llama-3.1-405b", + "name": "Hermes 3 Llama 3.1 405b", + "family": "hermes", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-09-25", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.1, + "output": 3.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/kimi-k2-5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 3.75, + "cache_read": 0.125 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04", + "release_date": "2025-12-10", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 3.2, + "cache_read": 0.375 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/llama-3.2-3b", + "name": "Llama 3.2 3B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-10-03", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.6 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/llama-3.3-70b", + "name": "Llama 3.3 70B", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2025-04-06", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.8 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/minimax-m21", + "name": "MiniMax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-12-01", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.04 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "venice/minimax-m25", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.04 + }, + "limit": { + "context": 198000, + "output": 32000 + } + }, + { + "id": "venice/mistral-31-24b", + "name": "Venice Medium", + "family": "mistral", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2025-03-18", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.5, + "output": 2.0 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/olafangensan-glm-4.7-flash-heretic", + "name": "GLM 4.7 Flash Heretic", + "family": "glm-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-04", + "last_updated": "2026-02-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.14, + "output": 0.8 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/openai-gpt-52", + "name": "GPT-5.2", + "family": "gpt", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2025-12-13", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/openai-gpt-52-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2025-01-15", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/openai-gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "family": "gpt-oss", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11-06", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.07, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/qwen3-235b-a22b-instruct", + "name": "Qwen 3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 0.75 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/qwen3-235b-a22b-thinking", + "name": "Qwen 3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.45, + "output": 3.5 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/qwen3-4b", + "name": "Venice Small", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.05, + "output": 0.15 + }, + "limit": { + "context": 32000, + "output": 8000 + } + }, + { + "id": "venice/qwen3-coder-480b-a35b-instruct", + "name": "Qwen 3 Coder 480b", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.75, + "output": 3.0 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/qwen3-next-80b", + "name": "Qwen 3 Next 80b", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.35, + "output": 1.9 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/qwen3-vl-235b-a22b", + "name": "Qwen3 VL 235B", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-16", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.25, + "output": 1.5 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "venice/venice-uncensored", + "name": "Venice Uncensored 1.1", + "family": "venice", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-10", + "release_date": "2025-03-18", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.2, + "output": 0.9 + }, + "limit": { + "context": 32000, + "output": 8000 + } + }, + { + "id": "venice/zai-org-glm-4.7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-12-24", + "last_updated": "2026-01-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.55, + "output": 2.65, + "cache_read": 0.11 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "venice/zai-org-glm-4.7-flash", + "name": "GLM 4.7 Flash", + "family": "glm-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-01-29", + "last_updated": "2026-02-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.125, + "output": 0.5 + }, + "limit": { + "context": 128000, + "output": 32000 + } + }, + { + "id": "venice/zai-org-glm-5", + "name": "GLM 5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 + }, + "limit": { + "context": 198000, + "output": 49500 + } + }, + { + "id": "vercel/alibaba/qwen-3-14b", + "name": "Qwen3-14B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.06, + "output": 0.24 + }, + "limit": { + "context": 40960, + "output": 16384 + } + }, + { + "id": "vercel/alibaba/qwen-3-235b", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.13, + "output": 0.6 + }, + "limit": { + "context": 40960, + "output": 16384 + } + }, + { + "id": "vercel/alibaba/qwen-3-30b", + "name": "Qwen3-30B-A3B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.08, + "output": 0.29 + }, + "limit": { + "context": 40960, + "output": 16384 + } + }, + { + "id": "vercel/alibaba/qwen-3-32b", + "name": "Qwen 3.32B", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 40960, + "output": 16384 + } + }, + { + "id": "vercel/alibaba/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.9 + }, + "limit": { + "context": 262114, + "output": 262114 + } + }, + { + "id": "vercel/alibaba/qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.38, + "output": 1.53 + }, + "limit": { + "context": 262144, + "output": 66536 + } + }, + { + "id": "vercel/alibaba/qwen3-coder-30b-a3b", + "name": "Qwen 3 Coder 30B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.07, + "output": 0.27 + }, + "limit": { + "context": 160000, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2025-07-22", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 1.2 + }, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "vercel/alibaba/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.0, + "output": 5.0 + }, + "limit": { + "context": 1000000, + "output": 1000000 + } + }, + { + "id": "vercel/alibaba/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.01, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-embedding-4b", + "name": "Qwen3 Embedding 4B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-max", + "name": "Qwen3 Max", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 6.0 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-max-preview", + "name": "Qwen3 Max Preview", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.2, + "output": 6.0, + "cache_read": 0.24 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-max-thinking", + "name": "Qwen 3 Max Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.2, + "output": 6.0, + "cache_read": 0.24 + }, + "limit": { + "context": 256000, + "output": 65536 + } + }, + { + "id": "vercel/alibaba/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "family": "qwen", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.09, + "output": 1.1 + }, + "limit": { + "context": 262144, + "output": 32768 + } + }, + { + "id": "vercel/alibaba/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "family": "qwen", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "vercel/alibaba/qwen3-vl-instruct", + "name": "Qwen3 VL Instruct", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 2.8 + }, + "limit": { + "context": 131072, + "output": 129024 + } + }, + { + "id": "vercel/alibaba/qwen3-vl-thinking", + "name": "Qwen3 VL Thinking", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.7, + "output": 8.4 + }, + "limit": { + "context": 131072, + "output": 129024 + } + }, + { + "id": "vercel/alibaba/qwen3.5-plus", + "name": "Qwen 3.5 Plus", + "family": "qwen", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 2.4, + "cache_read": 0.04, + "cache_write": 0.5 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "vercel/amazon/nova-2-lite", + "name": "Nova 2 Lite", + "family": "nova", + "attachment": true, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5 + }, + "limit": { + "context": 1000000, + "output": 1000000 + } + }, + { + "id": "vercel/amazon/nova-lite", + "name": "Nova Lite", + "family": "nova-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 + }, + "limit": { + "context": 300000, + "output": 8192 + } + }, + { + "id": "vercel/amazon/nova-micro", + "name": "Nova Micro", + "family": "nova-micro", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/amazon/nova-pro", + "name": "Nova Pro", + "family": "nova-pro", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 + }, + "limit": { + "context": 300000, + "output": 8192 + } + }, + { + "id": "vercel/amazon/titan-embed-text-v2", + "name": "Titan Text Embeddings V2", + "family": "titan-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-04", + "last_updated": "2024-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.02, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "vercel/anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "vercel/anthropic/claude-3-opus", + "name": "Claude Opus 3", + "family": "claude-opus", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 4096 + } + }, + { + "id": "vercel/anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "vercel/anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "family": "claude-sonnet", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 8192 + } + }, + { + "id": "vercel/anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "vercel/anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "family": "claude-haiku", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "vercel/anthropic/claude-opus-4", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "vercel/anthropic/claude-opus-4.1", + "name": "Claude Opus 4", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 32000 + } + }, + { + "id": "vercel/anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 18.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "vercel/anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-02", + "last_updated": "2026-02", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "vercel/anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "vercel/anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 200000, + "output": 64000 + } + }, + { + "id": "vercel/anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "limit": { + "context": 1000000, + "output": 128000 + } + }, + { + "id": "vercel/arcee-ai/trinity-large-preview", + "name": "Trinity Large Preview", + "family": "trinity", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-01", + "last_updated": "2025-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 131000, + "output": 131000 + } + }, + { + "id": "vercel/arcee-ai/trinity-mini", + "name": "Trinity Mini", + "family": "trinity", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2025-12", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.05, + "output": 0.15 + }, + "limit": { + "context": 131072, + "output": 131072 + } + }, + { + "id": "vercel/bfl/flux-kontext-max", + "name": "FLUX.1 Kontext Max", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-06", + "last_updated": "2025-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 512, + "output": 0 + } + }, + { + "id": "vercel/bfl/flux-kontext-pro", + "name": "FLUX.1 Kontext Pro", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-06", + "last_updated": "2025-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 512, + "output": 0 + } + }, + { + "id": "vercel/bfl/flux-pro-1.0-fill", + "name": "FLUX.1 Fill [pro]", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-10", + "last_updated": "2024-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 512, + "output": 0 + } + }, + { + "id": "vercel/bfl/flux-pro-1.1", + "name": "FLUX1.1 [pro]", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-10", + "last_updated": "2024-10", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 512, + "output": 0 + } + }, + { + "id": "vercel/bfl/flux-pro-1.1-ultra", + "name": "FLUX1.1 [pro] Ultra", + "family": "flux", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-11", + "last_updated": "2024-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 512, + "output": 0 + } + }, + { + "id": "vercel/bytedance/seed-1.6", + "name": "Seed 1.6", + "family": "seed", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09", + "last_updated": "2025-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.05 + }, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "vercel/bytedance/seed-1.8", + "name": "Seed 1.8", + "family": "seed", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-10", + "last_updated": "2025-10", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 2.0, + "cache_read": 0.05 + }, + "limit": { + "context": 256000, + "output": 64000 + } + }, + { + "id": "vercel/cohere/command-a", + "name": "Command A", + "family": "command", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.5, + "output": 10.0 + }, + "limit": { + "context": 256000, + "output": 8000 + } + }, + { + "id": "vercel/cohere/embed-v4.0", + "name": "Embed v4.0", + "family": "cohere-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.12, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "vercel/deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.35, + "output": 5.4 + }, + "limit": { + "context": 128000, + "output": 32768 + } + }, + { + "id": "vercel/deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.77, + "output": 0.77 + }, + "limit": { + "context": 163840, + "output": 16384 + } + }, + { + "id": "vercel/deepseek/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.0 + }, + "limit": { + "context": 163840, + "output": 128000 + } + }, + { + "id": "vercel/deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.0 + }, + "limit": { + "context": 131072, + "output": 65536 + } + }, + { + "id": "vercel/deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.4, + "cache_read": 0.22 + }, + "limit": { + "context": 163842, + "output": 8000 + } + }, + { + "id": "vercel/deepseek/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "family": "deepseek", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.27, + "output": 0.4 + }, + "limit": { + "context": 163840, + "output": 163840 + } + }, + { + "id": "vercel/deepseek/deepseek-v3.2-thinking", + "name": "DeepSeek V3.2 Thinking", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "vercel/google/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "vercel/google/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.075, + "output": 0.3 + }, + "limit": { + "context": 1048576, + "output": 8192 + } + }, + { + "id": "vercel/google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "vercel/google/gemini-2.5-flash-image", + "name": "Nano Banana (Gemini 2.5 Flash Image)", + "family": "gemini-flash", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "vercel/google/gemini-2.5-flash-image-preview", + "name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", + "family": "gemini-flash", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5 + }, + "limit": { + "context": 32768, + "output": 32768 + } + }, + { + "id": "vercel/google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "vercel/google/gemini-2.5-flash-lite-preview-09", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "family": "gemini-flash-lite", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "vercel/google/gemini-2.5-flash-preview-09", + "name": "Gemini 2.5 Flash Preview 09-25", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "cache_write": 0.383 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "vercel/google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 1.25, + "output": 10.0, + "cache_read": 0.31 + }, + "limit": { + "context": 1048576, + "output": 65536 + } + }, + { + "id": "vercel/google/gemini-3-flash", + "name": "Gemini 3 Flash", + "family": "gemini-flash", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "vercel/google/gemini-3-pro-image", + "name": "Nano Banana Pro (Gemini 3 Pro Image)", + "family": "gemini-pro", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2025-03", + "release_date": "2025-09", + "last_updated": "2025-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text", + "image" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 120.0 + }, + "limit": { + "context": 65536, + "output": 32768 + } + }, + { + "id": "vercel/google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 + }, + "limit": { + "context": 1000000, + "output": 64000 + } + }, + { + "id": "vercel/google/gemini-embedding-001", + "name": "Gemini Embedding 001", + "family": "gemini-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "vercel/google/imagen-4.0-fast-generate-001", + "name": "Imagen 4 Fast", + "family": "imagen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-06", + "last_updated": "2025-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "vercel/google/imagen-4.0-generate-001", + "name": "Imagen 4", + "family": "imagen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "vercel/google/imagen-4.0-ultra-generate-001", + "name": "Imagen 4 Ultra", + "family": "imagen", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 480, + "output": 0 + } + }, + { + "id": "vercel/google/text-embedding-005", + "name": "Text Embedding 005", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-08", + "last_updated": "2024-08", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.03, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "vercel/google/text-multilingual-embedding-002", + "name": "Text Multilingual Embedding 002", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-03", + "last_updated": "2024-03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.03, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "vercel/inception/mercury-coder-small", + "name": "Mercury Coder Small Beta", + "family": "mercury", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-02-26", + "last_updated": "2025-02-26", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.25, + "output": 1.0 + }, + "limit": { + "context": 32000, + "output": 16384 + } + }, + { + "id": "vercel/kwaipilot/kat-coder-pro-v1", + "name": "KAT-Coder-Pro V1", + "family": "kat-coder", + "attachment": false, + "reasoning": true, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-10-24", + "last_updated": "2025-10-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 32000 + } + }, + { + "id": "vercel/meituan/longcat-flash-chat", + "name": "LongCat Flash Chat", + "family": "longcat", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-08-30", + "last_updated": "2025-08-30", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/meituan/longcat-flash-thinking", + "name": "LongCat Flash Thinking", + "family": "longcat", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 1.5 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/meta/llama-3.1-70b", + "name": "Llama 3.1 70B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.4, + "output": 0.4 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "vercel/meta/llama-3.1-8b", + "name": "Llama 3.1 8B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.03, + "output": 0.05 + }, + "limit": { + "context": 131072, + "output": 16384 + } + }, + { + "id": "vercel/meta/llama-3.2-11b", + "name": "Llama 3.2 11B Vision Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.16, + "output": 0.16 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/meta/llama-3.2-1b", + "name": "Llama 3.2 1B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/meta/llama-3.2-3b", + "name": "Llama 3.2 3B Instruct", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.15 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/meta/llama-3.2-90b", + "name": "Llama 3.2 90B Vision Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.72, + "output": 0.72 + }, + "limit": { + "context": 128000, + "output": 8192 + } + }, + { + "id": "vercel/meta/llama-3.3-70b", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "vercel/meta/llama-4-maverick", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "vercel/meta/llama-4-scout", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "family": "llama", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 128000, + "output": 4096 + } + }, + { + "id": "vercel/minimax/minimax-m2", + "name": "MiniMax M2", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.27, + "output": 1.15, + "cache_read": 0.03, + "cache_write": 0.38 + }, + "limit": { + "context": 262114, + "output": 262114 + } + }, + { + "id": "vercel/minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.38 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "vercel/minimax/minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 2.4, + "cache_read": 0.03, + "cache_write": 0.38 + }, + "limit": { + "context": 204800, + "output": 131072 + } + }, + { + "id": "vercel/minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "family": "minimax", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-19", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + }, + "limit": { + "context": 204800, + "output": 131000 + } + }, + { + "id": "vercel/mistral/codestral", + "name": "Codestral", + "family": "codestral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.3, + "output": 0.9 + }, + "limit": { + "context": 256000, + "output": 4096 + } + }, + { + "id": "vercel/mistral/codestral-embed", + "name": "Codestral Embed", + "family": "codestral-embed", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.15, + "output": 0.0 + }, + "limit": { + "context": 8192, + "output": 1536 + } + }, + { + "id": "vercel/mistral/devstral-2", + "name": "Devstral 2", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "vercel/mistral/devstral-small", + "name": "Devstral Small 1.1", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.1, + "output": 0.3 + }, + "limit": { + "context": 128000, + "output": 64000 + } + }, + { + "id": "vercel/mistral/devstral-small-2", + "name": "Devstral Small 2", + "family": "devstral", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": {}, + "limit": { + "context": 256000, + "output": 256000 + } + }, + { + "id": "vercel/mistral/magistral-medium", + "name": "Magistral Medium", + "family": "magistral-medium", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 2.0, + "output": 5.0 }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 } }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "family": "gpt-pro", - "attachment": true, + "id": "vercel/mistral/magistral-small", + "name": "Magistral Small", + "family": "magistral-small", + "attachment": false, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 21.0, - "output": 168.0 + "input": 0.5, + "output": 1.5 }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 } }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "family": "gpt-codex", + "id": "vercel/mistral/ministral-14b", + "name": "Ministral 14B", + "family": "ministral", "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "reasoning": false, + "tool_call": false, + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ "text", @@ -9188,89 +79484,82 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 0.2, + "output": 0.2 }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 } }, { - "id": "openai/gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "family": "gpt-codex-spark", - "attachment": true, - "reasoning": true, + "id": "vercel/mistral/ministral-3b", + "name": "Ministral 3B", + "family": "ministral", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 0.04, + "output": 0.04 }, "limit": { "context": 128000, - "output": 32000 + "output": 128000 } }, { - "id": "openai/o1", - "name": "o1", - "family": "o", - "attachment": true, - "reasoning": true, + "id": "vercel/mistral/ministral-8b", + "name": "Ministral 8B", + "family": "ministral", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "temperature": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 15.0, - "output": 60.0, - "cache_read": 7.5 + "input": 0.1, + "output": 0.1 }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 } }, { - "id": "openai/o1-mini", - "name": "o1-mini", - "family": "o-mini", + "id": "vercel/mistral/mistral-embed", + "name": "Mistral Embed", + "family": "mistral-embed", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": false, "temperature": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "modalities": { "input": [ "text" @@ -9281,29 +79570,29 @@ }, "open_weights": false, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.1, + "output": 0.0 }, "limit": { - "context": 128000, - "output": 65536 + "context": 8192, + "output": 1536 } }, { - "id": "openai/o1-preview", - "name": "o1-preview", - "family": "o", - "attachment": false, - "reasoning": true, + "id": "vercel/mistral/mistral-large-3", + "name": "Mistral Large 3", + "family": "mistral-large", + "attachment": true, + "reasoning": false, "tool_call": false, "temperature": true, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-10", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -9311,26 +79600,25 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 60.0, - "cache_read": 7.5 + "input": 0.5, + "output": 1.5 }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 256000 } }, { - "id": "openai/o1-pro", - "name": "o1-pro", - "family": "o-pro", + "id": "vercel/mistral/mistral-medium", + "name": "Mistral Medium 3.1", + "family": "mistral-medium", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2023-09", - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "modalities": { "input": [ "text", @@ -9342,29 +79630,28 @@ }, "open_weights": false, "cost": { - "input": 150.0, - "output": 600.0 + "input": 0.4, + "output": 2.0 }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 64000 } }, { - "id": "openai/o3", - "name": "o3", - "family": "o", - "attachment": true, - "reasoning": true, + "id": "vercel/mistral/mistral-nemo", + "name": "Mistral Nemo", + "family": "mistral-nemo", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -9372,26 +79659,25 @@ }, "open_weights": false, "cost": { - "input": 2.0, - "output": 8.0, - "cache_read": 0.5 + "input": 0.04, + "output": 0.17 }, "limit": { - "context": 200000, - "output": 100000 + "context": 60288, + "output": 16000 } }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "family": "o", - "attachment": true, - "reasoning": true, + "id": "vercel/mistral/mistral-small", + "name": "Mistral Small", + "family": "mistral-small", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "temperature": true, + "knowledge": "2025-03", + "release_date": "2024-09-01", + "last_updated": "2024-09-04", "modalities": { "input": [ "text", @@ -9401,28 +79687,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 10.0, - "output": 40.0, - "cache_read": 2.5 + "input": 0.1, + "output": 0.3 }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 16384 } }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "family": "o-mini", + "id": "vercel/mistral/mixtral-8x22b-instruct", + "name": "Mixtral 8x22B", + "family": "mixtral", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "temperature": true, + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "modalities": { "input": [ "text" @@ -9431,28 +79716,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 2.0, + "output": 6.0 }, "limit": { - "context": 200000, - "output": 100000 + "context": 64000, + "output": 64000 } }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "family": "o-pro", + "id": "vercel/mistral/pixtral-12b", + "name": "Pixtral 12B", + "family": "pixtral", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "temperature": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "modalities": { "input": [ "text", @@ -9462,27 +79746,27 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 20.0, - "output": 80.0 + "input": 0.15, + "output": 0.15 }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 } }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "family": "o-mini", + "id": "vercel/mistral/pixtral-large", + "name": "Pixtral Large", + "family": "pixtral", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "temperature": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "modalities": { "input": [ "text", @@ -9492,59 +79776,56 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 2.0, + "output": 6.0 }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 } }, { - "id": "openai/o4-mini-deep-research", - "name": "o4-mini-deep-research", - "family": "o-mini", - "attachment": true, - "reasoning": true, + "id": "vercel/moonshotai/kimi-k2", + "name": "Kimi K2 Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "temperature": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 8.0, - "cache_read": 0.5 + "input": 1.0, + "output": 3.0 }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 } }, { - "id": "openai/text-embedding-3-large", - "name": "text-embedding-3-large", - "family": "text-embedding", + "id": "vercel/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "family": "kimi-thinking", "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "modalities": { "input": [ "text" @@ -9555,25 +79836,26 @@ }, "open_weights": false, "cost": { - "input": 0.13, - "output": 0.0 + "input": 0.47, + "output": 2.0, + "cache_read": 0.14 }, "limit": { - "context": 8191, - "output": 3072 + "context": 216144, + "output": 216144 } }, { - "id": "openai/text-embedding-3-small", - "name": "text-embedding-3-small", - "family": "text-embedding", + "id": "vercel/moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "family": "kimi-thinking", "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "modalities": { "input": [ "text" @@ -9584,25 +79866,26 @@ }, "open_weights": false, "cost": { - "input": 0.02, - "output": 0.0 + "input": 1.15, + "output": 8.0, + "cache_read": 0.15 }, "limit": { - "context": 8191, - "output": 1536 + "context": 262114, + "output": 262114 } }, { - "id": "openai/text-embedding-ada-002", - "name": "text-embedding-ada-002", - "family": "text-embedding", + "id": "vercel/moonshotai/kimi-k2-turbo", + "name": "Kimi K2 Turbo", + "family": "kimi", "attachment": false, "reasoning": false, - "tool_call": false, - "temperature": false, - "knowledge": "2022-12", - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "tool_call": true, + "temperature": true, + "knowledge": "2024-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -9613,25 +79896,25 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.0 + "input": 2.4, + "output": 10.0 }, "limit": { - "context": 8192, - "output": 1536 + "context": 256000, + "output": 16384 } }, { - "id": "openrouter/allenai/molmo-2-8b:free", - "name": "Molmo2 8B (free)", - "family": "allenai", - "attachment": false, + "id": "vercel/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "family": "kimi", + "attachment": true, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2026-01-09", - "last_updated": "2026-01-31", + "knowledge": "2025-01", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "modalities": { "input": [ "text", @@ -9644,30 +79927,27 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.6, + "output": 1.2 }, "limit": { - "context": 36864, - "output": 36864 + "context": 262144, + "output": 262144 } }, { - "id": "openrouter/anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - "family": "claude-haiku", - "attachment": true, + "id": "vercel/morph/morph-v3-fast", + "name": "Morph v3 Fast", + "family": "morph", + "attachment": false, "reasoning": false, - "tool_call": true, - "temperature": true, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "tool_call": false, + "temperature": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -9676,31 +79956,55 @@ "open_weights": false, "cost": { "input": 0.8, - "output": 4.0, - "cache_read": 0.08, - "cache_write": 1.0 + "output": 1.2 }, "limit": { - "context": 200000, - "output": 8192 + "context": 16000, + "output": 16000 } }, { - "id": "openrouter/anthropic/claude-3.7-sonnet", - "name": "Claude Sonnet 3.7", - "family": "claude-sonnet", - "attachment": true, + "id": "vercel/morph/morph-v3-large", + "name": "Morph v3 Large", + "family": "morph", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.9, + "output": 1.9 + }, + "limit": { + "context": 32000, + "output": 32000 + } + }, + { + "id": "vercel/nvidia/nemotron-3-nano-30b-a3b", + "name": "Nemotron 3 Nano 30B A3B", + "family": "nemotron", + "attachment": false, "reasoning": true, - "tool_call": true, + "tool_call": false, "temperature": true, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -9708,32 +80012,29 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.06, + "output": 0.24 }, "limit": { - "context": 200000, - "output": 128000 + "context": 262144, + "output": 262144 } }, { - "id": "openrouter/anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "family": "claude-haiku", + "id": "vercel/nvidia/nemotron-nano-12b-v2-vl", + "name": "Nvidia Nemotron Nano 12B V2 VL", + "family": "nemotron", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -9741,32 +80042,28 @@ }, "open_weights": false, "cost": { - "input": 1.0, - "output": 5.0, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.2, + "output": 0.6 }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 } }, { - "id": "openrouter/anthropic/claude-opus-4", - "name": "Claude Opus 4", - "family": "claude-opus", - "attachment": true, + "id": "vercel/nvidia/nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B V2", + "family": "nemotron", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -9774,27 +80071,25 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.04, + "output": 0.16 }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 131072 } }, { - "id": "openrouter/anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "family": "claude-opus", + "id": "vercel/openai/codex-mini", + "name": "Codex Mini", + "family": "gpt-codex-mini", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-10", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "modalities": { "input": [ "text", @@ -9807,32 +80102,29 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 75.0, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.5, + "output": 6.0, + "cache_read": 0.38 }, "limit": { "context": 200000, - "output": 32000 + "output": 100000 } }, { - "id": "openrouter/anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5", - "family": "claude-opus", - "attachment": true, - "reasoning": true, - "tool_call": true, + "id": "vercel/openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, "temperature": true, - "knowledge": "2025-05-30", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -9840,32 +80132,28 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 1.5 }, "limit": { - "context": 200000, - "output": 32000 + "context": 16385, + "output": 4096 } }, { - "id": "openrouter/anthropic/claude-opus-4.6", - "name": "Claude Opus 4.6", - "family": "claude-opus", - "attachment": true, - "reasoning": true, - "tool_call": true, + "id": "vercel/openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "family": "gpt", + "attachment": false, + "reasoning": false, + "tool_call": false, "temperature": true, - "knowledge": "2025-05-30", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -9873,32 +80161,29 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.5, + "output": 2.0 }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8192, + "output": 4096 } }, { - "id": "openrouter/anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "family": "claude-sonnet", + "id": "vercel/openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "family": "gpt", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -9906,32 +80191,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 10.0, + "output": 30.0 }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 } }, { - "id": "openrouter/anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "family": "claude-sonnet", + "id": "vercel/openai/gpt-4.1", + "name": "GPT-4.1", + "family": "gpt", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -9939,617 +80221,657 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1047576, + "output": 32768 } }, { - "id": "openrouter/arcee-ai/trinity-large-preview:free", - "name": "Trinity Large Preview", - "family": "trinity", - "attachment": false, + "id": "vercel/openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "family": "gpt-mini", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "limit": { - "context": 131072, - "output": 131072 + "context": 1047576, + "output": 32768 } }, { - "id": "openrouter/arcee-ai/trinity-mini:free", - "name": "Trinity Mini", - "family": "trinity-mini", - "attachment": false, + "id": "vercel/openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "family": "gpt-nano", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "limit": { - "context": 131072, - "output": 131072 + "context": 1047576, + "output": 32768 } }, { - "id": "openrouter/black-forest-labs/flux.2-flex", - "name": "FLUX.2 Flex", - "family": "flux", - "attachment": false, + "id": "vercel/openai/gpt-4o", + "name": "GPT-4o", + "family": "gpt", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-11-25", - "last_updated": "2026-01-31", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ - "image", "text" ] }, "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 2.5, + "output": 10.0, + "cache_read": 1.25 }, "limit": { - "context": 67344, - "output": 67344 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/black-forest-labs/flux.2-klein-4b", - "name": "FLUX.2 Klein 4B", - "family": "flux", - "attachment": false, + "id": "vercel/openai/gpt-4o-mini", + "name": "GPT-4o mini", + "family": "gpt-mini", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2026-01-14", - "last_updated": "2026-01-31", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ - "image", "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/black-forest-labs/flux.2-max", - "name": "FLUX.2 Max", - "family": "flux", + "id": "vercel/openai/gpt-4o-mini-search-preview", + "name": "GPT 4o Mini Search Preview", + "family": "gpt-mini", "attachment": false, "reasoning": false, "tool_call": false, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-12-16", - "last_updated": "2026-01-31", + "knowledge": "2023-09", + "release_date": "2025-01", + "last_updated": "2025-01", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.15, + "output": 0.6 }, "limit": { - "context": 46864, - "output": 46864 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/black-forest-labs/flux.2-pro", - "name": "FLUX.2 Pro", - "family": "flux", - "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-11-25", - "last_updated": "2026-01-31", + "id": "vercel/openai/gpt-5", + "name": "GPT-5", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ - "image", "text" ] }, "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 }, "limit": { - "context": 46864, - "output": 46864 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/bytedance-seed/seedream-4.5", - "name": "Seedream 4.5", - "family": "seed", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "vercel/openai/gpt-5-chat", + "name": "GPT-5 Chat", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-12-23", - "last_updated": "2026-01-31", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ - "image", - "text" + "text", + "image" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/cognitivecomputations/dolphin-mistral-24b-venice-edition:free", - "name": "Uncensored (free)", - "family": "mistral", + "id": "vercel/openai/gpt-5-codex", + "name": "GPT-5-Codex", + "family": "gpt-codex", "attachment": false, - "reasoning": false, - "tool_call": false, - "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-07-09", - "last_updated": "2026-01-31", + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 }, "limit": { - "context": 32768, - "output": 32768 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/cognitivecomputations/dolphin3.0-mistral-24b", - "name": "Dolphin3.0 Mistral 24B", - "family": "mistral", - "attachment": false, - "reasoning": false, + "id": "vercel/openai/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-02-13", - "last_updated": "2025-02-13", + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.25, + "output": 2.0, + "cache_read": 0.025 }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/cognitivecomputations/dolphin3.0-r1-mistral-24b", - "name": "Dolphin3.0 R1 Mistral 24B", - "family": "mistral", - "attachment": false, + "id": "vercel/openai/gpt-5-nano", + "name": "GPT-5 Nano", + "family": "gpt-nano", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-02-13", - "last_updated": "2025-02-13", + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-chat-v3", - "name": "DeepSeek V3 0324", - "family": "deepseek", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "vercel/openai/gpt-5-pro", + "name": "GPT-5 pro", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, "knowledge": "2024-10", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 15.0, + "output": 120.0 }, "limit": { - "context": 16384, - "output": 8192 + "context": 400000, + "output": 272000 } }, { - "id": "openrouter/deepseek/deepseek-chat-v3.1", - "name": "DeepSeek-V3.1", - "family": "deepseek", - "attachment": false, + "id": "vercel/openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "family": "gpt", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.2, - "output": 0.8 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-r1-0528-qwen3-8b:free", - "name": "Deepseek R1 0528 Qwen3 8B (free)", - "family": "qwen", - "attachment": false, + "id": "vercel/openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "family": "gpt", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-29", - "last_updated": "2025-05-29", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-r1-0528:free", - "name": "R1 0528 (free)", - "family": "deepseek", - "attachment": false, + "id": "vercel/openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "family": "gpt", + "attachment": true, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2024-10", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "family": "deepseek-thinking", - "attachment": false, + "id": "vercel/openai/gpt-5.1-instant", + "name": "GPT-5.1 Instant", + "family": "gpt", + "attachment": true, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, "knowledge": "2024-10", - "release_date": "2025-01-23", - "last_updated": "2025-01-23", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/deepseek/deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "family": "qwen", - "attachment": false, + "id": "vercel/openai/gpt-5.1-thinking", + "name": "GPT 5.1 Thinking", + "family": "gpt", + "attachment": true, "reasoning": true, - "tool_call": false, - "temperature": true, + "tool_call": true, + "temperature": false, "knowledge": "2024-10", - "release_date": "2025-01-29", - "last_updated": "2025-01-29", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.13 }, "limit": { - "context": 64000, - "output": 8192 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-r1:free", - "name": "R1 (free)", - "family": "deepseek", - "attachment": false, + "id": "vercel/openai/gpt-5.2", + "name": "GPT-5.2", + "family": "gpt", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.75, + "output": 14.0, + "cache_read": 0.18 }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-v3-base:free", - "name": "DeepSeek V3 Base (free)", - "family": "deepseek", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "vercel/openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "family": "gpt", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2025-03", - "release_date": "2025-03-29", - "last_updated": "2025-03-29", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.75, + "output": 14.0, + "cache_read": 0.18 }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "family": "deepseek", - "attachment": false, + "id": "vercel/openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "family": "gpt-codex", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2025-12", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.27, - "output": 1.0 + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-v3.1-terminus:exacto", - "name": "DeepSeek V3.1 Terminus (exacto)", - "family": "deepseek", - "attachment": false, + "id": "vercel/openai/gpt-5.2-pro", + "name": "GPT 5.2 ", + "family": "gpt", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.27, - "output": 1.0 + "input": 21.0, + "output": 168.0 }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "family": "deepseek", + "id": "vercel/openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ "text" @@ -10560,25 +80882,25 @@ }, "open_weights": true, "cost": { - "input": 0.28, - "output": 0.4 + "input": 0.1, + "output": 0.5 }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 131072 } }, { - "id": "openrouter/deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek V3.2 Speciale", - "family": "deepseek", + "id": "vercel/openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "family": "gpt-oss", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ "text" @@ -10589,25 +80911,25 @@ }, "open_weights": true, "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.07, + "output": 0.3 }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 32768 } }, { - "id": "openrouter/featherless/qwerky-72b", - "name": "Qwerky 72B", - "family": "qwerky", + "id": "vercel/openai/gpt-oss-safeguard-20b", + "name": "gpt-oss-safeguard-20b", + "family": "gpt-oss", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, "knowledge": "2024-10", - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "modalities": { "input": [ "text" @@ -10616,34 +80938,32 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.08, + "output": 0.3, + "cache_read": 0.04 }, "limit": { - "context": 32768, - "output": 8192 + "context": 131072, + "output": 65536 } }, { - "id": "openrouter/google/gemini-2.0-flash-001", - "name": "Gemini 2.0 Flash", - "family": "gemini-flash", + "id": "vercel/openai/o1", + "name": "o1", + "family": "o", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "temperature": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -10651,26 +80971,26 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 15.0, + "output": 60.0, + "cache_read": 7.5 }, "limit": { - "context": 1048576, - "output": 8192 + "context": 200000, + "output": 100000 } }, { - "id": "openrouter/google/gemini-2.0-flash-exp:free", - "name": "Gemini 2.0 Flash Experimental (free)", - "family": "gemini-flash", + "id": "vercel/openai/o3", + "name": "o3", + "family": "o", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-12", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "modalities": { "input": [ "text", @@ -10682,31 +81002,30 @@ }, "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 2.0, + "output": 8.0, + "cache_read": 0.5 }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 200000, + "output": 100000 } }, { - "id": "openrouter/google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "family": "gemini-flash", + "id": "vercel/openai/o3-deep-research", + "name": "o3-deep-research", + "family": "o", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-07-17", - "last_updated": "2025-07-17", + "temperature": false, + "knowledge": "2024-10", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -10715,33 +81034,29 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.0375 + "input": 10.0, + "output": 40.0, + "cache_read": 2.5 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 } }, { - "id": "openrouter/google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "family": "gemini-flash-lite", - "attachment": true, + "id": "vercel/openai/o3-mini", + "name": "o3-mini", + "family": "o-mini", + "attachment": false, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "temperature": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -10749,32 +81064,30 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 } }, { - "id": "openrouter/google/gemini-2.5-flash-lite-preview-09", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "family": "gemini-flash-lite", + "id": "vercel/openai/o3-pro", + "name": "o3 Pro", + "family": "o-pro", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "temperature": false, + "knowledge": "2024-10", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -10783,33 +81096,29 @@ }, "open_weights": false, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 20.0, + "output": 80.0 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 } }, { - "id": "openrouter/google/gemini-2.5-flash-preview-09", - "name": "Gemini 2.5 Flash Preview 09-25", - "family": "gemini-flash", + "id": "vercel/openai/o4-mini", + "name": "o4-mini", + "family": "o-mini", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "temperature": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -10817,33 +81126,28 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.031 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 } }, { - "id": "openrouter/google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "id": "vercel/openai/text-embedding-3-large", + "name": "text-embedding-3-large", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "modalities": { + "input": [ + "text" ], "output": [ "text" @@ -10851,33 +81155,27 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.13, + "output": 0.0 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/google/gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "id": "vercel/openai/text-embedding-3-small", + "name": "text-embedding-3-small", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -10885,33 +81183,27 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.02, + "output": 0.0 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/google/gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "family": "gemini-pro", - "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "id": "vercel/openai/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "family": "text-embedding", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -10919,33 +81211,29 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.31 + "input": 0.1, + "output": 0.0 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "family": "gemini-flash", + "id": "vercel/perplexity/sonar", + "name": "Sonar", + "family": "sonar", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -10953,33 +81241,29 @@ }, "open_weights": false, "cost": { - "input": 0.5, - "output": 3.0, - "cache_read": 0.05 + "input": 1.0, + "output": 1.0 }, "limit": { - "context": 1048576, - "output": 65536 + "context": 127000, + "output": 8000 } }, { - "id": "openrouter/google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "family": "gemini-pro", + "id": "vercel/perplexity/sonar-pro", + "name": "Sonar Pro", + "family": "sonar-pro", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -10987,25 +81271,25 @@ }, "open_weights": false, "cost": { - "input": 2.0, - "output": 12.0 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 1050000, - "output": 66000 + "context": 200000, + "output": 8000 } }, { - "id": "openrouter/google/gemma-2-9b-it", - "name": "Gemma 2 9B", - "family": "gemma", + "id": "vercel/perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "family": "sonar-reasoning", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": false, "temperature": true, - "knowledge": "2024-06", - "release_date": "2024-06-28", - "last_updated": "2024-06-28", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "modalities": { "input": [ "text" @@ -11014,40 +81298,39 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.03, - "output": 0.09 + "input": 2.0, + "output": 8.0 }, "limit": { - "context": 8192, - "output": 8192 + "context": 127000, + "output": 8000 } }, { - "id": "openrouter/google/gemma-3-12b-it", - "name": "Gemma 3 12B", - "family": "gemma", - "attachment": true, - "reasoning": false, - "tool_call": false, + "id": "vercel/prime-intellect/intellect-3", + "name": "INTELLECT 3", + "family": "intellect", + "attachment": false, + "reasoning": true, + "tool_call": true, "temperature": true, "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.03, - "output": 0.1 + "input": 0.2, + "output": 1.1 }, "limit": { "context": 131072, @@ -11055,76 +81338,65 @@ } }, { - "id": "openrouter/google/gemma-3-12b-it:free", - "name": "Gemma 3 12B (free)", - "family": "gemma", - "attachment": true, + "id": "vercel/recraft/recraft-v2", + "name": "Recraft V2", + "family": "recraft", + "attachment": false, "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "temperature": false, + "release_date": "2024-03", + "last_updated": "2024-03", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, - "open_weights": true, - "cost": { - "input": 0.0, - "output": 0.0 - }, + "open_weights": false, + "cost": {}, "limit": { - "context": 32768, - "output": 8192 + "context": 512, + "output": 0 } }, { - "id": "openrouter/google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "family": "gemma", - "attachment": true, + "id": "vercel/recraft/recraft-v3", + "name": "Recraft V3", + "family": "recraft", + "attachment": false, "reasoning": false, - "tool_call": true, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "tool_call": false, + "temperature": false, + "release_date": "2024-10", + "last_updated": "2024-10", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, - "open_weights": true, - "cost": { - "input": 0.04, - "output": 0.15 - }, + "open_weights": false, + "cost": {}, "limit": { - "context": 96000, - "output": 96000 + "context": 512, + "output": 0 } }, { - "id": "openrouter/google/gemma-3-27b-it:free", - "name": "Gemma 3 27B (free)", - "family": "gemma", + "id": "vercel/vercel/v0-1.0-md", + "name": "v0-1.0-md", + "family": "v0", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "modalities": { "input": [ "text", @@ -11134,27 +81406,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32000 } }, { - "id": "openrouter/google/gemma-3-4b-it", - "name": "Gemma 3 4B", - "family": "gemma", + "id": "vercel/vercel/v0-1.5-md", + "name": "v0-1.5-md", + "family": "v0", "attachment": true, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "modalities": { "input": [ "text", @@ -11164,57 +81435,54 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.01703, - "output": 0.06815 + "input": 3.0, + "output": 15.0 }, "limit": { - "context": 96000, - "output": 96000 + "context": 128000, + "output": 32000 } }, { - "id": "openrouter/google/gemma-3-4b-it:free", - "name": "Gemma 3 4B (free)", - "family": "gemma", - "attachment": true, + "id": "vercel/voyage/voyage-3-large", + "name": "voyage-3-large", + "family": "voyage", + "attachment": false, "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "temperature": false, + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, + "input": 0.18, "output": 0.0 }, "limit": { - "context": 32768, - "output": 8192 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/google/gemma-3n-e2b-it:free", - "name": "Gemma 3n 2B (free)", - "family": "gemma", - "attachment": true, + "id": "vercel/voyage/voyage-3.5", + "name": "voyage-3.5", + "family": "voyage", + "attachment": false, "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2024-06", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "temperature": false, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "modalities": { "input": [ "text" @@ -11223,25 +81491,24 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, + "input": 0.06, "output": 0.0 }, "limit": { "context": 8192, - "output": 2000 + "output": 1536 } }, { - "id": "openrouter/google/gemma-3n-e4b-it", - "name": "Gemma 3n 4B", - "family": "gemma", - "attachment": true, + "id": "vercel/voyage/voyage-3.5-lite", + "name": "voyage-3.5-lite", + "family": "voyage", + "attachment": false, "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2024-06", + "temperature": false, "release_date": "2025-05-20", "last_updated": "2025-05-20", "modalities": { @@ -11252,27 +81519,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { "input": 0.02, - "output": 0.04 + "output": 0.0 }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/google/gemma-3n-e4b-it:free", - "name": "Gemma 3n 4B (free)", - "family": "gemma", - "attachment": true, + "id": "vercel/voyage/voyage-code-2", + "name": "voyage-code-2", + "family": "voyage", + "attachment": false, "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2024-06", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "temperature": false, + "release_date": "2024-01", + "last_updated": "2024-01", "modalities": { "input": [ "text" @@ -11281,27 +81547,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, + "input": 0.12, "output": 0.0 }, "limit": { "context": 8192, - "output": 2000 + "output": 1536 } }, { - "id": "openrouter/kwaipilot/kat-coder-pro:free", - "name": "Kat Coder Pro (free)", - "family": "kat-coder", + "id": "vercel/voyage/voyage-code-3", + "name": "voyage-code-3", + "family": "voyage", "attachment": false, "reasoning": false, - "tool_call": true, - "temperature": true, - "knowledge": "2025-11", - "release_date": "2025-11-10", - "last_updated": "2025-11-10", + "tool_call": false, + "temperature": false, + "release_date": "2024-09", + "last_updated": "2024-09", "modalities": { "input": [ "text" @@ -11312,25 +81577,24 @@ }, "open_weights": false, "cost": { - "input": 0.0, + "input": 0.18, "output": 0.0 }, "limit": { - "context": 256000, - "output": 65536 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/liquid/lfm-2.5-1.2b-instruct:free", - "name": "LFM2.5-1.2B-Instruct (free)", - "family": "liquid", + "id": "vercel/voyage/voyage-finance-2", + "name": "voyage-finance-2", + "family": "voyage", "attachment": false, "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2025-06", - "release_date": "2026-01-20", - "last_updated": "2026-01-28", + "temperature": false, + "release_date": "2024-03", + "last_updated": "2024-03", "modalities": { "input": [ "text" @@ -11339,27 +81603,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, + "input": 0.12, "output": 0.0 }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/liquid/lfm-2.5-1.2b-thinking:free", - "name": "LFM2.5-1.2B-Thinking (free)", - "family": "liquid", + "id": "vercel/voyage/voyage-law-2", + "name": "voyage-law-2", + "family": "voyage", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": false, - "temperature": true, - "knowledge": "2025-06", - "release_date": "2026-01-20", - "last_updated": "2026-01-28", + "temperature": false, + "release_date": "2024-03", + "last_updated": "2024-03", "modalities": { "input": [ "text" @@ -11368,27 +81631,58 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, + "input": 0.12, "output": 0.0 }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 1536 } }, { - "id": "openrouter/meta-llama/llama-3.1-405b-instruct:free", - "name": "Llama 3.1 405B Instruct (free)", - "family": "llama", + "id": "vercel/xai/grok-2-vision", + "name": "Grok 2 Vision", + "family": "grok", "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, "knowledge": "2024-08", - "release_date": "2024-07-23", - "last_updated": "2025-04-05", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 2.0, + "output": 10.0, + "cache_read": 2.0 + }, + "limit": { + "context": 8192, + "output": 4096 + } + }, + { + "id": "vercel/xai/grok-3", + "name": "Grok 3", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ "text" @@ -11397,40 +81691,41 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 } }, { - "id": "openrouter/meta-llama/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11B Vision Instruct", - "family": "llama", - "attachment": true, + "id": "vercel/xai/grok-3-fast", + "name": "Grok 3 Fast", + "family": "grok", + "attachment": false, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 5.0, + "output": 25.0, + "cache_read": 1.25 }, "limit": { "context": 131072, @@ -11438,46 +81733,46 @@ } }, { - "id": "openrouter/meta-llama/llama-3.2-3b-instruct:free", - "name": "Llama 3.2 3B Instruct (free)", - "family": "llama", - "attachment": true, - "reasoning": false, - "tool_call": false, + "id": "vercel/xai/grok-3-mini", + "name": "Grok 3 Mini", + "family": "grok", + "attachment": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 } }, { - "id": "openrouter/meta-llama/llama-3.3-70b-instruct:free", - "name": "Llama 3.3 70B Instruct (free)", - "family": "llama", + "id": "vercel/xai/grok-3-mini-fast", + "name": "Grok 3 Mini Fast", + "family": "grok", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ "text" @@ -11486,57 +81781,58 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.6, + "output": 4.0, + "cache_read": 0.15 }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 } }, { - "id": "openrouter/meta-llama/llama-4-scout:free", - "name": "Llama 4 Scout (free)", - "family": "llama", - "attachment": true, - "reasoning": false, + "id": "vercel/xai/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 }, "limit": { - "context": 64000, + "context": 256000, "output": 64000 } }, { - "id": "openrouter/microsoft/mai-ds-r1:free", - "name": "MAI DS R1 (free)", - "family": "mai", + "id": "vercel/xai/grok-4-fast", + "name": "Grok 4 Fast Reasoning", + "family": "grok", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-04-21", - "last_updated": "2025-04-21", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ "text" @@ -11545,26 +81841,28 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 163840, - "output": 163840 + "context": 2000000, + "output": 256000 } }, { - "id": "openrouter/minimax/minimax-01", - "name": "MiniMax-01", - "family": "minimax", + "id": "vercel/xai/grok-4-fast-non", + "name": "Grok 4 Fast (Non-Reasoning)", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "modalities": { "input": [ "text", @@ -11574,26 +81872,28 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { "input": 0.2, - "output": 1.1 + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/minimax/minimax-m1", - "name": "MiniMax M1", - "family": "minimax", + "id": "vercel/xai/grok-4.1-fast", + "name": "Grok 4.1 Fast Reasoning", + "family": "grok", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ "text" @@ -11602,26 +81902,28 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.4, - "output": 2.2 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 1000000, - "output": 40000 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/minimax/minimax-m2", - "name": "MiniMax M2", - "family": "minimax", + "id": "vercel/xai/grok-4.1-fast-non", + "name": "Grok 4.1 Fast Non-Reasoning", + "family": "grok", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-10-23", - "last_updated": "2025-10-23", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ "text" @@ -11630,28 +81932,28 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.28, - "output": 1.15, - "cache_read": 0.28, - "cache_write": 1.15 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 196600, - "output": 118000 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "family": "minimax", + "id": "vercel/xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "modalities": { "input": [ "text" @@ -11660,85 +81962,80 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 10000 } }, { - "id": "openrouter/minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "family": "minimax", + "id": "vercel/xai/grok-imagine-image", + "name": "Grok Imagine Image", + "family": "grok", "attachment": false, - "reasoning": true, - "tool_call": true, + "reasoning": false, + "tool_call": false, "temperature": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-19", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, - "open_weights": true, - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 - }, + "open_weights": false, + "cost": {}, "limit": { - "context": 204800, - "output": 131072 + "context": 0, + "output": 0 } }, { - "id": "openrouter/mistralai/codestral", - "name": "Codestral 2508", - "family": "codestral", + "id": "vercel/xai/grok-imagine-image-pro", + "name": "Grok Imagine Image Pro", + "family": "grok", "attachment": false, "reasoning": false, - "tool_call": true, + "tool_call": false, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "release_date": "2026-01-28", + "last_updated": "2026-02-19", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, - "open_weights": true, - "cost": { - "input": 0.3, - "output": 0.9 - }, + "open_weights": false, + "cost": {}, "limit": { - "context": 256000, - "output": 256000 + "context": 0, + "output": 0 } }, { - "id": "openrouter/mistralai/devstral", - "name": "Devstral 2 2512", - "family": "devstral", + "id": "vercel/xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "family": "mimo", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-12", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "knowledge": "2024-10", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ "text" @@ -11747,27 +82044,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.1, + "output": 0.29 }, "limit": { "context": 262144, - "output": 262144 + "output": 32000 } }, { - "id": "openrouter/mistralai/devstral-2512:free", - "name": "Devstral 2 2512 (free)", - "family": "devstral", + "id": "vercel/zai/glm-4.5", + "name": "GLM 4.5", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-12", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "knowledge": "2025-07", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -11778,25 +82075,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.6, + "output": 2.2 }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 131072 } }, { - "id": "openrouter/mistralai/devstral-medium", - "name": "Devstral Medium", - "family": "devstral", + "id": "vercel/zai/glm-4.5-air", + "name": "GLM 4.5 Air", + "family": "glm-air", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -11807,28 +82104,29 @@ }, "open_weights": true, "cost": { - "input": 0.4, - "output": 2.0 + "input": 0.2, + "output": 1.1 }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 96000 } }, { - "id": "openrouter/mistralai/devstral-small", - "name": "Devstral Small 1.1", - "family": "devstral", - "attachment": false, - "reasoning": false, + "id": "vercel/zai/glm-4.5v", + "name": "GLM 4.5V", + "family": "glm", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2025-08", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -11836,25 +82134,25 @@ }, "open_weights": true, "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.6, + "output": 1.8 }, "limit": { - "context": 131072, - "output": 131072 + "context": 66000, + "output": 66000 } }, { - "id": "openrouter/mistralai/devstral-small-2505:free", - "name": "Devstral Small 2505 (free)", - "family": "devstral", + "id": "vercel/zai/glm-4.6", + "name": "GLM 4.6", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ "text" @@ -11865,88 +82163,88 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.45, + "output": 1.8 }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 96000 } }, { - "id": "openrouter/mistralai/mistral-7b-instruct:free", - "name": "Mistral 7B Instruct (free)", - "family": "mistral", - "attachment": false, - "reasoning": false, + "id": "vercel/zai/glm-4.6v", + "name": "GLM-4.6V", + "family": "glm", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-05", - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.3, + "output": 0.9, + "cache_read": 0.05 }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 24000 } }, { - "id": "openrouter/mistralai/mistral-medium-3", - "name": "Mistral Medium 3", - "family": "mistral-medium", + "id": "vercel/zai/glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "family": "glm", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "open_weights": false, - "cost": { - "input": 0.4, - "output": 2.0 - }, + "cost": {}, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 24000 } }, { - "id": "openrouter/mistralai/mistral-medium-3.1", - "name": "Mistral Medium 3.1", - "family": "mistral-medium", - "attachment": true, - "reasoning": false, + "id": "vercel/zai/glm-4.7", + "name": "GLM 4.7", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "knowledge": "2024-10", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -11954,25 +82252,26 @@ }, "open_weights": false, "cost": { - "input": 0.4, - "output": 2.0 + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 120000 } }, { - "id": "openrouter/mistralai/mistral-nemo:free", - "name": "Mistral Nemo (free)", - "family": "mistral-nemo", + "id": "vercel/zai/glm-4.7-flashx", + "name": "GLM 4.7 FlashX", + "family": "glm-flash", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2024-07-19", - "last_updated": "2024-07-19", + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", "modalities": { "input": [ "text" @@ -11983,59 +82282,58 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 128000 } }, { - "id": "openrouter/mistralai/mistral-small-3.1-24b-instruct", - "name": "Mistral Small 3.1 24B Instruct", - "family": "mistral-small", - "attachment": true, - "reasoning": false, + "id": "vercel/zai/glm-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "release_date": "2026-02-12", + "last_updated": "2026-02-19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 }, "limit": { - "context": 128000, - "output": 8192 + "context": 202800, + "output": 131072 } }, { - "id": "openrouter/mistralai/mistral-small-3.2-24b-instruct", - "name": "Mistral Small 3.2 24B Instruct", - "family": "mistral-small", - "attachment": true, - "reasoning": false, + "id": "vivgrid/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "family": "deepseek", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12043,84 +82341,92 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.28, + "output": 0.42 }, "limit": { - "context": 96000, - "output": 8192 + "context": 128000, + "output": 128000 } }, { - "id": "openrouter/mistralai/mistral-small-3.2-24b-instruct:free", - "name": "Mistral Small 3.2 24B (free)", - "family": "mistral-small", + "id": "vivgrid/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "family": "gemini-flash", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.5, + "output": 3.0, + "cache_read": 0.05 }, "limit": { - "context": 96000, - "output": 96000 + "context": 1048576, + "output": 65536 } }, { - "id": "openrouter/moonshotai/kimi-dev-72b:free", - "name": "Kimi Dev 72b (free)", - "family": "kimi", - "attachment": false, - "reasoning": false, + "id": "vivgrid/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "family": "gemini-pro", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 2.0, + "output": 12.0, + "cache_read": 0.2 }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 } }, { - "id": "openrouter/moonshotai/kimi-k2", - "name": "Kimi K2 Instruct 0905", - "family": "kimi", + "id": "vivgrid/glm-5", + "name": "GLM-5", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "modalities": { "input": [ "text" @@ -12131,145 +82437,150 @@ }, "open_weights": true, "cost": { - "input": 0.6, - "output": 2.5 + "input": 1.0, + "output": 3.2, + "cache_read": 0.2 }, "limit": { - "context": 262144, - "output": 16384 - } - }, - { - "id": "openrouter/moonshotai/kimi-k2-0905:exacto", - "name": "Kimi K2 Instruct 0905 (exacto)", - "family": "kimi", - "attachment": false, - "reasoning": false, + "context": 202752, + "output": 131000 + } + }, + { + "id": "vivgrid/gpt-5-mini", + "name": "GPT-5 Mini", + "family": "gpt-mini", + "attachment": true, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "temperature": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 }, "limit": { - "context": 262144, - "output": 16384 + "context": 272000, + "output": 128000 } }, { - "id": "openrouter/moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "family": "kimi-thinking", + "id": "vivgrid/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "family": "gpt-codex", "attachment": false, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "family": "kimi", - "attachment": true, + "id": "vivgrid/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "family": "gpt-codex", + "attachment": false, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "temperature": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 3.0, - "cache_read": 0.1 + "input": 1.25, + "output": 10.0, + "cache_read": 0.125 }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/moonshotai/kimi-k2:free", - "name": "Kimi K2 (free)", - "family": "kimi", + "id": "vivgrid/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "family": "gpt-codex", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "temperature": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.75, + "output": 14.0, + "cache_read": 0.175 }, "limit": { - "context": 32800, - "output": 32800 + "context": 400000, + "output": 128000 } }, { - "id": "openrouter/nousresearch/deephermes-3-llama-3-8b-preview", - "name": "DeepHermes 3 Llama 3 8B Preview", - "family": "llama", + "id": "vultr/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "family": "deepseek-thinking", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-02-28", - "last_updated": "2025-02-28", + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "modalities": { "input": [ "text" @@ -12280,25 +82591,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.2, + "output": 0.2 }, "limit": { - "context": 131072, + "context": 121808, "output": 8192 } }, { - "id": "openrouter/nousresearch/hermes-3-llama-3.1-405b:free", - "name": "Hermes 3 405B Instruct (free)", - "family": "hermes", + "id": "vultr/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "family": "qwen", "attachment": false, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-08-16", - "last_updated": "2024-08-16", + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "modalities": { "input": [ "text" @@ -12309,25 +82620,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.2, + "output": 0.2 }, "limit": { - "context": 131072, - "output": 131072 + "context": 121808, + "output": 8192 } }, { - "id": "openrouter/nousresearch/hermes-4-405b", - "name": "Hermes 4 405B", - "family": "hermes", + "id": "vultr/gpt-oss-120b", + "name": "GPT OSS 120B", + "family": "gpt-oss", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "knowledge": "2024-10", + "release_date": "2025-06-23", + "last_updated": "2025-06-23", "modalities": { "input": [ "text" @@ -12338,25 +82649,25 @@ }, "open_weights": true, "cost": { - "input": 1.0, - "output": 3.0 + "input": 0.2, + "output": 0.2 }, "limit": { - "context": 131072, - "output": 131072 + "context": 121808, + "output": 8192 } }, { - "id": "openrouter/nousresearch/hermes-4-70b", - "name": "Hermes 4 70B", - "family": "hermes", + "id": "vultr/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "family": "kimi", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "modalities": { "input": [ "text" @@ -12367,25 +82678,25 @@ }, "open_weights": true, "cost": { - "input": 0.13, - "output": 0.4 + "input": 0.2, + "output": 0.2 }, "limit": { - "context": 131072, - "output": 131072 + "context": 58904, + "output": 4096 } }, { - "id": "openrouter/nvidia/nemotron-3-nano-30b-a3b:free", - "name": "Nemotron 3 Nano 30B A3B (free)", - "family": "nemotron", + "id": "vultr/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-11", - "release_date": "2025-12-14", - "last_updated": "2026-01-31", + "knowledge": "2024-10", + "release_date": "2024-11-06", + "last_updated": "2024-11-06", "modalities": { "input": [ "text" @@ -12396,29 +82707,28 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.2, + "output": 0.2 }, "limit": { - "context": 256000, - "output": 256000 + "context": 12952, + "output": 2048 } }, { - "id": "openrouter/nvidia/nemotron-nano-12b-v2-vl:free", - "name": "Nemotron Nano 12B 2 VL (free)", - "family": "nemotron", + "id": "wandb/Qwen/Qwen3-235B-A22B-Instruct", + "name": "Qwen3 235B A22B Instruct 2507", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-11", - "release_date": "2025-10-28", - "last_updated": "2026-01-31", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12426,25 +82736,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.1, + "output": 0.1 }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 131072 } }, { - "id": "openrouter/nvidia/nemotron-nano-9b-v2", - "name": "nvidia-nemotron-nano-9b-v2", - "family": "nemotron", + "id": "wandb/Qwen/Qwen3-235B-A22B-Thinking", + "name": "Qwen3-235B-A22B-Thinking-2507", + "family": "qwen", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-09", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "modalities": { "input": [ "text" @@ -12455,25 +82765,25 @@ }, "open_weights": true, "cost": { - "input": 0.04, - "output": 0.16 + "input": 0.1, + "output": 0.1 }, "limit": { - "context": 131072, + "context": 262144, "output": 131072 } }, { - "id": "openrouter/nvidia/nemotron-nano-9b-v2:free", - "name": "Nemotron Nano 9B V2 (free)", - "family": "nemotron", + "id": "wandb/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "family": "qwen", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-09", - "release_date": "2025-09-05", - "last_updated": "2025-08-18", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "modalities": { "input": [ "text" @@ -12484,148 +82794,141 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.0, + "output": 1.5 }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 66536 } }, { - "id": "openrouter/openai/gpt-4.1", - "name": "GPT-4.1", - "family": "gpt", - "attachment": true, - "reasoning": false, + "id": "wandb/deepseek-ai/DeepSeek-R1", + "name": "DeepSeek-R1-0528", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 8.0, - "cache_read": 0.5 + "input": 1.35, + "output": 5.4 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 161000, + "output": 163840 } }, { - "id": "openrouter/openai/gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "family": "gpt-mini", - "attachment": true, + "id": "wandb/deepseek-ai/DeepSeek-V3", + "name": "DeepSeek-V3-0324", + "family": "deepseek", + "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1.14, + "output": 2.75 }, "limit": { - "context": 1047576, - "output": 32768 + "context": 161000, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-4o-mini", - "name": "GPT-4o-mini", - "family": "gpt-mini", - "attachment": true, - "reasoning": false, + "id": "wandb/meta-llama/Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "family": "llama", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.22, + "output": 0.22 }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 } }, { - "id": "openrouter/openai/gpt-5", - "name": "GPT-5", - "family": "gpt", - "attachment": true, + "id": "wandb/meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "family": "llama", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0 + "input": 0.71, + "output": 0.71 }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 } }, { - "id": "openrouter/openai/gpt-5-chat", - "name": "GPT-5 Chat (latest)", - "family": "gpt-codex", - "attachment": true, + "id": "wandb/meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "family": "llama", + "attachment": false, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "modalities": { "input": [ "text", @@ -12635,95 +82938,88 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0 + "input": 0.17, + "output": 0.66 }, "limit": { - "context": 400000, - "output": 128000 + "context": 64000, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-5-codex", - "name": "GPT-5 Codex", - "family": "gpt-codex", - "attachment": true, + "id": "wandb/microsoft/Phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "family": "phi", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10-01", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 0.08, + "output": 0.35 }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 } }, { - "id": "openrouter/openai/gpt-5-image", - "name": "GPT-5 Image", - "family": "gpt", - "attachment": true, - "reasoning": true, + "id": "wandb/moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct", + "family": "kimi", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-10-01", - "release_date": "2025-10-14", - "last_updated": "2025-10-14", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 5.0, - "output": 10.0, - "cache_read": 1.25 + "input": 1.35, + "output": 4.0 }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 } }, { - "id": "openrouter/openai/gpt-5-mini", - "name": "GPT-5 Mini", - "family": "gpt-mini", - "attachment": true, - "reasoning": true, + "id": "x-ai/grok-2", + "name": "Grok 2 (1212)", + "family": "grok", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-12-12", + "last_updated": "2024-12-12", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12731,25 +83027,26 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 2.0 + "input": 2.0, + "output": 10.0, + "cache_read": 2.0 }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-5-nano", - "name": "GPT-5 Nano", - "family": "gpt-nano", + "id": "x-ai/grok-2-vision", + "name": "Grok 2 Vision Latest", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "modalities": { "input": [ "text", @@ -12761,29 +83058,29 @@ }, "open_weights": false, "cost": { - "input": 0.05, - "output": 0.4 + "input": 2.0, + "output": 10.0, + "cache_read": 2.0 }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 } }, { - "id": "openrouter/openai/gpt-5-pro", - "name": "GPT-5 Pro", - "family": "gpt-pro", - "attachment": true, - "reasoning": true, - "tool_call": true, - "temperature": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "id": "x-ai/grok-3", + "name": "Grok 3 Latest", + "family": "grok", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12791,29 +83088,29 @@ }, "open_weights": false, "cost": { - "input": 15.0, - "output": 120.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 }, "limit": { - "context": 400000, - "output": 272000 + "context": 131072, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-5.1", - "name": "GPT-5.1", - "family": "gpt", - "attachment": true, - "reasoning": true, + "id": "x-ai/grok-3-fast", + "name": "Grok 3 Fast Latest", + "family": "grok", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12821,30 +83118,29 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 5.0, + "output": 25.0, + "cache_read": 1.25 }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "family": "gpt-codex", - "attachment": true, + "id": "x-ai/grok-3-mini", + "name": "Grok 3 Mini Latest", + "family": "grok", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12852,30 +83148,29 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "family": "gpt-codex", - "attachment": true, + "id": "x-ai/grok-3-mini-fast", + "name": "Grok 3 Mini Fast", + "family": "grok", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12883,30 +83178,29 @@ }, "open_weights": false, "cost": { - "input": 1.25, - "output": 10.0, - "cache_read": 0.125 + "input": 0.6, + "output": 4.0, + "cache_read": 0.15 }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 } }, { - "id": "openrouter/openai/gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-Max", - "family": "gpt-codex", - "attachment": true, + "id": "x-ai/grok-4", + "name": "Grok 4", + "family": "grok", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -12914,26 +83208,26 @@ }, "open_weights": false, "cost": { - "input": 1.1, - "output": 9.0, - "cache_read": 0.11 + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 64000 } }, { - "id": "openrouter/openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "family": "gpt-codex", + "id": "x-ai/grok-4-fast", + "name": "Grok 4 Fast", + "family": "grok", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "modalities": { "input": [ "text", @@ -12945,26 +83239,26 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 2.0, - "cache_read": 0.025 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 400000, - "output": 100000 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/openai/gpt-5.2", - "name": "GPT-5.2", - "family": "gpt", + "id": "x-ai/grok-4-fast-non", + "name": "Grok 4 Fast (Non-Reasoning)", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "modalities": { "input": [ "text", @@ -12976,26 +83270,26 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "family": "gpt-codex", + "id": "x-ai/grok-4.1-fast", + "name": "Grok 4.1 Fast", + "family": "grok", "attachment": true, "reasoning": true, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "modalities": { "input": [ "text", @@ -13007,26 +83301,26 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "family": "gpt-codex", + "id": "x-ai/grok-4.1-fast-non", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "family": "grok", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "modalities": { "input": [ "text", @@ -13038,30 +83332,29 @@ }, "open_weights": false, "cost": { - "input": 1.75, - "output": 14.0, - "cache_read": 0.175 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 30000 } }, { - "id": "openrouter/openai/gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "family": "gpt-pro", - "attachment": true, - "reasoning": true, + "id": "x-ai/grok-beta", + "name": "Grok Beta", + "family": "grok-beta", + "attachment": false, + "reasoning": false, "tool_call": true, - "temperature": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "temperature": true, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -13069,24 +83362,26 @@ }, "open_weights": false, "cost": { - "input": 21.0, - "output": 168.0 + "input": 5.0, + "output": 15.0, + "cache_read": 5.0 }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 4096 } }, { - "id": "openrouter/openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "family": "gpt-oss", + "id": "x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "family": "grok", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "modalities": { "input": [ "text" @@ -13095,54 +83390,59 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.072, - "output": 0.28 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 10000 } }, { - "id": "openrouter/openai/gpt-oss-120b:exacto", - "name": "GPT OSS 120B (exacto)", - "family": "gpt-oss", - "attachment": false, - "reasoning": true, + "id": "x-ai/grok-vision-beta", + "name": "Grok Vision Beta", + "family": "grok-vision", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.05, - "output": 0.24 + "input": 5.0, + "output": 15.0, + "cache_read": 5.0 }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 4096 } }, { - "id": "openrouter/openai/gpt-oss-120b:free", - "name": "gpt-oss-120b (free)", - "family": "gpt-oss", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo-V2-Flash", + "family": "mimo", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-12-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ "text" @@ -13153,24 +83453,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.07, + "output": 0.21 }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 32000 } }, { - "id": "openrouter/openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "family": "gpt-oss", + "id": "zai-coding-plan/glm-4.5", + "name": "GLM-4.5", + "family": "glm", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -13181,24 +83482,27 @@ }, "open_weights": true, "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { "context": 131072, - "output": 32768 + "output": 98304 } }, { - "id": "openrouter/openai/gpt-oss-20b:free", - "name": "gpt-oss-20b (free)", - "family": "gpt-oss", + "id": "zai-coding-plan/glm-4.5-air", + "name": "GLM-4.5-Air", + "family": "glm-air", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-08-05", - "last_updated": "2026-01-31", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -13210,23 +83514,26 @@ "open_weights": true, "cost": { "input": 0.0, - "output": 0.0 + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { "context": 131072, - "output": 32768 + "output": 98304 } }, { - "id": "openrouter/openai/gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "family": "gpt-oss", + "id": "zai-coding-plan/glm-4.5-flash", + "name": "GLM-4.5-Flash", + "family": "glm-flash", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -13235,118 +83542,122 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { "context": 131072, - "output": 65536 + "output": 98304 } }, { - "id": "openrouter/openai/o4-mini", - "name": "o4 Mini", - "family": "o-mini", + "id": "zai-coding-plan/glm-4.5v", + "name": "GLM-4.5V", + "family": "glm", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 200000, - "output": 100000 + "context": 64000, + "output": 16384 } }, { - "id": "openrouter/openrouter/sherlock-dash-alpha", - "name": "Sherlock Dash Alpha", - "family": "sherlock", - "attachment": true, - "reasoning": false, + "id": "zai-coding-plan/glm-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-11", - "release_date": "2025-11-15", - "last_updated": "2025-12-14", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { "input": 0.0, - "output": 0.0 + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 1840000, - "output": 0 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/openrouter/sherlock-think-alpha", - "name": "Sherlock Think Alpha", - "family": "sherlock", + "id": "zai-coding-plan/glm-4.6v", + "name": "GLM-4.6V", + "family": "glm", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-11", - "release_date": "2025-11-15", - "last_updated": "2025-12-14", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { "input": 0.0, "output": 0.0 }, "limit": { - "context": 1840000, - "output": 0 + "context": 128000, + "output": 32768 } }, { - "id": "openrouter/qwen/qwen-2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "family": "qwen", + "id": "zai-coding-plan/glm-4.7", + "name": "GLM-4.7", + "family": "glm", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ "text" @@ -13358,28 +83669,29 @@ "open_weights": true, "cost": { "input": 0.0, - "output": 0.0 + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen-2.5-vl-7b-instruct:free", - "name": "Qwen2.5-VL 7B Instruct (free)", - "family": "qwen", - "attachment": true, - "reasoning": false, + "id": "zai-coding-plan/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm-flash", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-02", - "release_date": "2024-08-28", - "last_updated": "2024-08-28", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -13388,29 +83700,29 @@ "open_weights": true, "cost": { "input": 0.0, - "output": 0.0 + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen2.5-vl-32b-instruct:free", - "name": "Qwen2.5 VL 32B Instruct (free)", - "family": "qwen", - "attachment": true, - "reasoning": false, + "id": "zai-coding-plan/glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "family": "glm-flash", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -13418,59 +83730,60 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0.0 }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B Instruct", - "family": "qwen", - "attachment": true, - "reasoning": false, - "tool_call": false, + "id": "zai-coding-plan/glm-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { "input": 0.0, - "output": 0.0 + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen2.5-vl-72b-instruct:free", - "name": "Qwen2.5 VL 72B Instruct (free)", - "family": "qwen", - "attachment": true, - "reasoning": false, + "id": "zai/glm-4.5", + "name": "GLM-4.5", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-02", - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -13478,25 +83791,27 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0.0 }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 98304 } }, { - "id": "openrouter/qwen/qwen3-14b:free", - "name": "Qwen3 14B (free)", - "family": "qwen", + "id": "zai/glm-4.5-air", + "name": "GLM-4.5-Air", + "family": "glm-air", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -13507,25 +83822,27 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0.0 }, "limit": { - "context": 40960, - "output": 40960 + "context": 131072, + "output": 98304 } }, { - "id": "openrouter/qwen/qwen3-235b-a22b-07-25", - "name": "Qwen3 235B A22B Instruct 2507", - "family": "qwen", + "id": "zai/glm-4.5-flash", + "name": "GLM-4.5-Flash", + "family": "glm-flash", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -13536,28 +83853,32 @@ }, "open_weights": true, "cost": { - "input": 0.15, - "output": 0.85 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 98304 } }, { - "id": "openrouter/qwen/qwen3-235b-a22b-07-25:free", - "name": "Qwen3 235B A22B Instruct 2507 (free)", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zai/glm-4.5v", + "name": "GLM-4.5V", + "family": "glm", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -13565,25 +83886,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.6, + "output": 1.8 }, "limit": { - "context": 262144, - "output": 131072 + "context": 64000, + "output": 16384 } }, { - "id": "openrouter/qwen/qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking 2507", - "family": "qwen", + "id": "zai/glm-4.6", + "name": "GLM-4.6", + "family": "glm", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ "text" @@ -13594,28 +83915,32 @@ }, "open_weights": true, "cost": { - "input": 0.078, - "output": 0.312 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0.0 }, "limit": { - "context": 262144, - "output": 81920 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen3-235b-a22b:free", - "name": "Qwen3 235B A22B (free)", - "family": "qwen", - "attachment": false, + "id": "zai/glm-4.6v", + "name": "GLM-4.6V", + "family": "glm", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -13623,25 +83948,25 @@ }, "open_weights": true, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.3, + "output": 0.9 }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32768 } }, { - "id": "openrouter/qwen/qwen3-30b-a3b-instruct", - "name": "Qwen3 30B A3B Instruct 2507", - "family": "qwen", + "id": "zai/glm-4.7", + "name": "GLM-4.7", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ "text" @@ -13652,25 +83977,27 @@ }, "open_weights": true, "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0.0 }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen3-30b-a3b-thinking", - "name": "Qwen3 30B A3B Thinking 2507", - "family": "qwen", + "id": "zai/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm-flash", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "modalities": { "input": [ "text" @@ -13681,25 +84008,26 @@ }, "open_weights": true, "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen3-30b-a3b:free", - "name": "Qwen3 30B A3B (free)", - "family": "qwen", + "id": "zai/glm-5", + "name": "GLM-5", + "family": "glm", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "modalities": { "input": [ "text" @@ -13708,175 +84036,191 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.0, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0.0 }, "limit": { - "context": 40960, - "output": 40960 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/qwen/qwen3-32b:free", - "name": "Qwen3 32B (free)", - "family": "qwen", - "attachment": false, - "reasoning": true, + "id": "zenmux/anthropic/claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-01-01", + "release_date": "2024-11-04", + "last_updated": "2024-11-04", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.8, + "output": 4.0, + "cache_read": 0.08, + "cache_write": 1.0 }, "limit": { - "context": 40960, - "output": 40960 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-4b:free", - "name": "Qwen3 4B (free)", - "family": "qwen", - "attachment": false, - "reasoning": true, + "id": "zenmux/anthropic/claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet (Retiring Soon)", + "attachment": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-04-30", - "last_updated": "2025-07-23", + "knowledge": "2025-01-01", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 40960, - "output": 40960 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-8b:free", - "name": "Qwen3 8B (free)", - "family": "qwen", - "attachment": false, + "id": "zenmux/anthropic/claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-01-01", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 40960, - "output": 40960 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-coder", - "name": "Qwen3 Coder", - "family": "qwen", - "attachment": false, + "id": "zenmux/anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-01-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "modalities": { "input": [ + "image", "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.0, + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 }, "limit": { - "context": 262144, - "output": 66536 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/anthropic/claude-opus-4", + "name": "Claude Opus 4", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "knowledge": "2025-01-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.07, - "output": 0.27 + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 }, "limit": { - "context": 160000, - "output": 65536 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-01-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ "text" @@ -13884,85 +84228,94 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 1.5 + "input": 15.0, + "output": 75.0, + "cache_read": 1.5, + "cache_write": 18.75 }, "limit": { - "context": 128000, - "output": 66536 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-coder:exacto", - "name": "Qwen3 Coder (exacto)", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-01-01", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "modalities": { "input": [ + "pdf", + "image", "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.38, - "output": 1.53 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-coder:free", - "name": "Qwen3 Coder 480B A35B Instruct (free)", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-01-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "modalities": { "input": [ + "image", "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 5.0, + "output": 25.0, + "cache_read": 0.5, + "cache_write": 6.25 }, "limit": { - "context": 262144, - "output": 66536 + "context": 1000000, + "output": 128000 } }, { - "id": "openrouter/qwen/qwen3-max", - "name": "Qwen3 Max", - "family": "qwen", - "attachment": false, + "id": "zenmux/anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ "text" @@ -13970,112 +84323,119 @@ }, "open_weights": false, "cost": { - "input": 1.2, - "output": 6.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "knowledge": "2025-01-01", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.14, - "output": 1.4 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-next-80b-a3b-instruct:free", - "name": "Qwen3 Next 80B A3B Instruct (free)", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "knowledge": "2025-01-01", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.3, + "cache_write": 3.75 }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "family": "qwen", - "attachment": false, + "id": "zenmux/baidu/ernie-5.0-thinking-preview", + "name": "ERNIE 5.0", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "knowledge": "2025-01-01", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.84, + "output": 3.37 }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 64000 } }, { - "id": "openrouter/qwen/qwq-32b:free", - "name": "QwQ 32B (free)", - "family": "qwen", + "id": "zenmux/deepseek/deepseek-chat", + "name": "DeepSeek-V3.2 (Non-thinking Mode)", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-03", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "knowledge": "2025-01-01", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "modalities": { "input": [ "text" @@ -14084,27 +84444,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 64000 } - }, - { - "id": "openrouter/rekaai/reka-flash-3", - "name": "Reka Flash 3", - "family": "reka", + }, + { + "id": "zenmux/deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-10", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "knowledge": "2025-01-01", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", "modalities": { "input": [ "text" @@ -14113,27 +84473,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.28, + "output": 0.43 }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 64000 } }, { - "id": "openrouter/sarvamai/sarvam-m:free", - "name": "Sarvam-M (free)", - "family": "sarvam", + "id": "zenmux/deepseek/deepseek-v3.2-exp", + "name": "DeepSeek-V3.2-Exp", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-05", - "release_date": "2025-05-25", - "last_updated": "2025-05-25", + "knowledge": "2025-01-01", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "modalities": { "input": [ "text" @@ -14142,176 +84501,193 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.22, + "output": 0.33 }, "limit": { - "context": 32768, - "output": 32768 + "context": 163000, + "output": 64000 } }, { - "id": "openrouter/sourceful/riverflow-v2-fast-preview", - "name": "Riverflow V2 Fast Preview", - "family": "sourceful", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "zenmux/google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-12-08", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "modalities": { "input": [ + "pdf", + "image", "text", - "image" + "audio" ], "output": [ - "image" + "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.07, + "cache_write": 1.0 }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048000, + "output": 64000 } }, { - "id": "openrouter/sourceful/riverflow-v2-max-preview", - "name": "Riverflow V2 Max Preview", - "family": "sourceful", - "attachment": false, + "id": "zenmux/google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "attachment": true, "reasoning": false, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-12-08", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "modalities": { "input": [ + "pdf", + "image", "text", - "image" + "audio" ], "output": [ - "image" + "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03, + "cache_write": 1.0 }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048000, + "output": 64000 } }, { - "id": "openrouter/sourceful/riverflow-v2-standard-preview", - "name": "Riverflow V2 Standard Preview", - "family": "sourceful", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "zenmux/google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2025-06", - "release_date": "2025-12-08", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "modalities": { "input": [ + "pdf", + "image", "text", - "image" + "audio", + "video" ], "output": [ - "image" + "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.31, + "cache_write": 4.5 }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048000, + "output": 64000 } }, { - "id": "openrouter/stepfun/step-3.5-flash", - "name": "Step 3.5 Flash", - "family": "step", - "attachment": false, + "id": "zenmux/google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "knowledge": "2025-01-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ - "text" + "text", + "image", + "pdf", + "audio" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.5, + "output": 3.0, + "cache_read": 0.05, + "cache_write": 1.0 }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048000, + "output": 64000 } }, { - "id": "openrouter/stepfun/step-3.5-flash:free", - "name": "Step 3.5 Flash (free)", - "family": "step", - "attachment": false, + "id": "zenmux/google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "knowledge": "2025-01-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "modalities": { "input": [ - "text" + "text", + "image", + "pdf", + "audio", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 2.0, + "output": 12.0, + "cache_read": 0.2, + "cache_write": 4.5 }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048000, + "output": 64000 } }, { - "id": "openrouter/thudm/glm-z1-32b:free", - "name": "GLM Z1 32B (free)", - "family": "glm-z", + "id": "zenmux/inclusionai/ling-1t", + "name": "Ling-1T", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2025-01-01", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "modalities": { "input": [ "text" @@ -14320,27 +84696,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.56, + "output": 2.24, + "cache_read": 0.11 }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 64000 } }, { - "id": "openrouter/tngtech/deepseek-r1t2-chimera:free", - "name": "DeepSeek R1T2 Chimera (free)", - "family": "deepseek-thinking", + "id": "zenmux/inclusionai/ring-1t", + "name": "Ring-1T", "attachment": false, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2025-01-01", + "release_date": "2025-10-12", + "last_updated": "2025-10-12", "modalities": { "input": [ "text" @@ -14349,27 +84725,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.56, + "output": 2.24, + "cache_read": 0.11 }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 64000 } }, { - "id": "openrouter/tngtech/tng-r1t-chimera:free", - "name": "R1T Chimera (free)", - "family": "tngtech", + "id": "zenmux/kuaishou/kat-coder-pro-v1", + "name": "KAT-Coder-Pro-V1", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-11-26", - "last_updated": "2026-01-31", + "knowledge": "2025-01-01", + "release_date": "2025-10-23", + "last_updated": "2025-10-23", "modalities": { "input": [ "text" @@ -14378,27 +84754,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "limit": { - "context": 163840, - "output": 163840 + "context": 256000, + "output": 64000 } }, { - "id": "openrouter/x-ai/grok-3", - "name": "Grok 3", - "family": "grok", + "id": "zenmux/kuaishou/kat-coder-pro-v1-free", + "name": "KAT-Coder-Pro-V1 Free", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-01-01", + "release_date": "2025-10-23", + "last_updated": "2025-10-23", "modalities": { "input": [ "text" @@ -14409,27 +84785,24 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75, - "cache_write": 15.0 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 64000 } }, { - "id": "openrouter/x-ai/grok-3-beta", - "name": "Grok 3 Beta", - "family": "grok", + "id": "zenmux/minimax/minimax-m2", + "name": "MiniMax M2", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-01-01", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "modalities": { "input": [ "text" @@ -14440,27 +84813,26 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75, - "cache_write": 15.0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.38 }, "limit": { - "context": 131072, - "output": 8192 + "context": 204000, + "output": 64000 } }, { - "id": "openrouter/x-ai/grok-3-mini", - "name": "Grok 3 Mini", - "family": "grok", + "id": "zenmux/minimax/minimax-m2.1", + "name": "MiniMax M2.1", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-01-01", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ "text" @@ -14472,26 +84844,25 @@ "open_weights": false, "cost": { "input": 0.3, - "output": 0.5, - "cache_read": 0.075, - "cache_write": 0.5 + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.38 }, "limit": { - "context": 131072, - "output": 8192 + "context": 204000, + "output": 64000 } }, { - "id": "openrouter/x-ai/grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "family": "grok", + "id": "zenmux/minimax/minimax-m2.5", + "name": "MiniMax M2.5", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-01-01", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "modalities": { "input": [ "text" @@ -14503,26 +84874,25 @@ "open_weights": false, "cost": { "input": 0.3, - "output": 0.5, - "cache_read": 0.075, - "cache_write": 0.5 + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/x-ai/grok-4", - "name": "Grok 4", - "family": "grok", + "id": "zenmux/minimax/minimax-m2.5-lightning", + "name": "MiniMax: MiniMax M2.5 highspeed", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-01-01", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "modalities": { "input": [ "text" @@ -14533,31 +84903,29 @@ }, "open_weights": false, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75, - "cache_write": 15.0 + "input": 0.6, + "output": 4.8, + "cache_read": 0.06, + "cache_write": 0.75 }, "limit": { - "context": 256000, - "output": 64000 + "context": 204800, + "output": 131072 } }, { - "id": "openrouter/x-ai/grok-4-fast", - "name": "Grok 4 Fast", - "family": "grok", + "id": "zenmux/moonshotai/kimi-k2", + "name": "Kimi K2 0905", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "knowledge": "2025-01-01", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -14565,31 +84933,28 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.05 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262000, + "output": 64000 } }, { - "id": "openrouter/x-ai/grok-4.1-fast", - "name": "Grok 4.1 Fast", - "family": "grok", + "id": "zenmux/moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-01-01", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -14597,27 +84962,25 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.05 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262000, + "output": 64000 } }, { - "id": "openrouter/x-ai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "family": "grok", + "id": "zenmux/moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-08", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2025-01-01", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "modalities": { "input": [ "text" @@ -14628,291 +84991,301 @@ }, "open_weights": false, "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 1.15, + "output": 8.0, + "cache_read": 0.15 }, "limit": { - "context": 256000, - "output": 10000 + "context": 262000, + "output": 64000 } }, { - "id": "openrouter/xiaomi/mimo-v2-flash", - "name": "MiMo-V2-Flash", - "family": "mimo", - "attachment": false, + "id": "zenmux/moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-12", - "release_date": "2025-12-14", - "last_updated": "2025-12-14", + "knowledge": "2025-01-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.58, + "output": 3.02, + "cache_read": 0.1 }, "limit": { - "context": 262144, - "output": 65536 + "context": 262000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.5", - "name": "GLM 4.5", - "family": "glm", - "attachment": false, + "id": "zenmux/openai/gpt-5", + "name": "GPT-5", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-01-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.2 + "input": 1.25, + "output": 10.0, + "cache_read": 0.12 }, "limit": { - "context": 128000, - "output": 96000 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.5-air", - "name": "GLM 4.5 Air", - "family": "glm-air", - "attachment": false, + "id": "zenmux/openai/gpt-5-codex", + "name": "GPT-5 Codex", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-01-01", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.2, - "output": 1.1 + "input": 1.25, + "output": 10.0, + "cache_read": 0.12 }, "limit": { - "context": 128000, - "output": 96000 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.5-air:free", - "name": "GLM 4.5 Air (free)", - "family": "glm-air", - "attachment": false, + "id": "zenmux/openai/gpt-5.1", + "name": "GPT-5.1", + "attachment": true, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.0, - "output": 0.0 + "input": 1.25, + "output": 10.0, + "cache_read": 0.12 }, "limit": { - "context": 128000, - "output": 96000 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.5v", - "name": "GLM 4.5V", - "family": "glm", + "id": "zenmux/openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", "attachment": true, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ - "text", + "pdf", "image", - "video" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 1.8 + "input": 1.25, + "output": 10.0, + "cache_read": 0.12 }, "limit": { - "context": 64000, - "output": 16384 + "context": 128000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.6", - "name": "GLM 4.6", - "family": "glm", - "attachment": false, + "id": "zenmux/openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "attachment": true, "reasoning": true, - "tool_call": true, - "temperature": true, - "knowledge": "2025-09", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "tool_call": true, + "temperature": true, + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 1.25, + "output": 10.0, + "cache_read": 0.12 }, "limit": { - "context": 200000, - "output": 128000 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.6:exacto", - "name": "GLM 4.6 (exacto)", - "family": "glm", - "attachment": false, + "id": "zenmux/openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-09", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "modalities": { "input": [ + "image", "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 1.9, - "cache_read": 0.11 + "input": 0.25, + "output": 2.0, + "cache_read": 0.03 }, "limit": { - "context": 200000, - "output": 128000 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.7", - "name": "GLM-4.7", - "family": "glm", - "attachment": false, + "id": "zenmux/openai/gpt-5.2", + "name": "GPT-5.2", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "temperature": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 1.75, + "output": 14.0, + "cache_read": 0.17 }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-4.7-flash", - "name": "GLM-4.7", - "family": "glm", - "attachment": false, + "id": "zenmux/openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "attachment": true, "reasoning": true, "tool_call": true, - "temperature": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "temperature": false, + "knowledge": "2025-01-01", + "release_date": "2026-01-15", + "last_updated": "2026-01-15", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.07, - "output": 0.4 + "input": 1.75, + "output": 14.0, + "cache_read": 0.17 }, "limit": { - "context": 200000, - "output": 65535 + "context": 400000, + "output": 64000 } }, { - "id": "openrouter/z-ai/glm-5", - "name": "GLM-5", - "family": "glm", + "id": "zenmux/qwen/qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-01-01", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "modalities": { "input": [ "text" @@ -14921,31 +85294,31 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { "input": 1.0, - "output": 3.2, - "cache_read": 0.2 + "output": 5.0, + "cache_read": 0.1, + "cache_write": 1.25 }, "limit": { - "context": 202752, - "output": 131000 + "context": 1000000, + "output": 64000 } }, { - "id": "venice/claude-opus-4.6", - "name": "Claude Opus 4.6", - "family": "claude-opus", - "attachment": true, + "id": "zenmux/qwen/qwen3-max", + "name": "Qwen3-Max-Thinking", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-01-01", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -14953,32 +85326,28 @@ }, "open_weights": false, "cost": { - "input": 6.0, - "output": 30.0, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 1.2, + "output": 6.0 }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 64000 } }, { - "id": "venice/claude-opus-45", - "name": "Claude Opus 4.5", - "family": "claude-opus", + "id": "zenmux/stepfun/step-3", + "name": "Step-3", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03", - "release_date": "2025-12-06", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "modalities": { "input": [ - "text", "image", - "pdf" + "text" ], "output": [ "text" @@ -14986,31 +85355,27 @@ }, "open_weights": false, "cost": { - "input": 6.0, - "output": 30.0, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.21, + "output": 0.57 }, "limit": { - "context": 198000, - "output": 49500 + "context": 65536, + "output": 64000 } }, { - "id": "venice/claude-sonnet-45", - "name": "Claude Sonnet 4.5", - "family": "claude-sonnet", - "attachment": true, - "reasoning": true, + "id": "zenmux/stepfun/step-3.5-flash", + "name": "Step 3.5 Flash", + "attachment": false, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-09", - "release_date": "2025-01-15", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -15018,27 +85383,24 @@ }, "open_weights": false, "cost": { - "input": 3.75, - "output": 18.75, - "cache_read": 0.375, - "cache_write": 4.69 + "input": 0.1, + "output": 0.3 }, "limit": { - "context": 198000, - "output": 49500 + "context": 256000, + "output": 64000 } }, { - "id": "venice/deepseek-v3.2", - "name": "DeepSeek V3.2", - "family": "deepseek", + "id": "zenmux/stepfun/step-3.5-flash-free", + "name": "Step 3.5 Flash (Free)", "attachment": false, "reasoning": true, - "tool_call": false, + "tool_call": true, "temperature": true, - "knowledge": "2025-10", - "release_date": "2025-12-04", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "modalities": { "input": [ "text" @@ -15047,35 +85409,31 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.4, - "output": 1.0, - "cache_read": 0.2 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 160000, - "output": 40000 + "context": 256000, + "output": 64000 } }, { - "id": "venice/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "family": "gemini-flash", + "id": "zenmux/volcengine/doubao-seed-1.8", + "name": "Doubao-Seed-1.8", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-12-19", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" @@ -15083,9 +85441,10 @@ }, "open_weights": false, "cost": { - "input": 0.7, - "output": 3.75, - "cache_read": 0.07 + "input": 0.11, + "output": 0.28, + "cache_read": 0.02, + "cache_write": 0.0024 }, "limit": { "context": 256000, @@ -15093,21 +85452,19 @@ } }, { - "id": "venice/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "family": "gemini-pro", + "id": "zenmux/volcengine/doubao-seed-2.0-lite", + "name": "Doubao-Seed-2.0-lite", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-12-02", - "last_updated": "2026-01-28", + "knowledge": "2026-02-14", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -15116,60 +85473,63 @@ }, "open_weights": false, "cost": { - "input": 2.5, - "output": 15.0, - "cache_read": 0.625 + "input": 0.09, + "output": 0.51, + "cache_read": 0.02, + "cache_write": 0.0024 }, "limit": { - "context": 198000, - "output": 49500 + "context": 256000, + "output": 64000 } }, { - "id": "venice/google-gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "family": "gemma", + "id": "zenmux/volcengine/doubao-seed-2.0-mini", + "name": "Doubao-Seed-2.0-mini", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-11-04", - "last_updated": "2026-01-28", + "knowledge": "2026-02-14", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.12, - "output": 0.2 + "input": 0.03, + "output": 0.28, + "cache_read": 0.01, + "cache_write": 0.0024 }, "limit": { - "context": 198000, - "output": 49500 + "context": 256000, + "output": 64000 } }, { - "id": "venice/grok-41-fast", - "name": "Grok 4.1 Fast", - "family": "grok", + "id": "zenmux/volcengine/doubao-seed-2.0-pro", + "name": "Doubao-Seed-2.0-pro", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-12-01", - "last_updated": "2026-01-28", + "knowledge": "2026-02-14", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -15177,9 +85537,10 @@ }, "open_weights": false, "cost": { - "input": 0.5, - "output": 1.25, - "cache_read": 0.125 + "input": 0.45, + "output": 2.24, + "cache_read": 0.09, + "cache_write": 0.0024 }, "limit": { "context": 256000, @@ -15187,18 +85548,19 @@ } }, { - "id": "venice/grok-code-fast-1", - "name": "Grok Code Fast 1", - "family": "grok", - "attachment": false, + "id": "zenmux/volcengine/doubao-seed-code", + "name": "Doubao-Seed-Code", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-12-01", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -15206,8 +85568,8 @@ }, "open_weights": false, "cost": { - "input": 0.25, - "output": 1.87, + "input": 0.17, + "output": 1.12, "cache_read": 0.03 }, "limit": { @@ -15216,45 +85578,45 @@ } }, { - "id": "venice/hermes-3-llama-3.1-405b", - "name": "Hermes 3 Llama 3.1 405b", - "family": "hermes", - "attachment": false, - "reasoning": false, - "tool_call": false, + "id": "zenmux/x-ai/grok-4", + "name": "Grok 4", + "attachment": true, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-09-25", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "modalities": { "input": [ + "image", "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 1.1, - "output": 3.0 + "input": 3.0, + "output": 15.0, + "cache_read": 0.75 }, "limit": { - "context": 128000, - "output": 32000 + "context": 256000, + "output": 64000 } }, { - "id": "venice/kimi-k2-5", - "name": "Kimi K2.5", - "family": "kimi", + "id": "zenmux/x-ai/grok-4-fast", + "name": "Grok 4 Fast", "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2026-01-27", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "modalities": { "input": [ "text", @@ -15264,87 +85626,87 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.75, - "output": 3.75, - "cache_read": 0.125 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 256000, + "context": 2000000, "output": 64000 } }, { - "id": "venice/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "family": "kimi-thinking", - "attachment": false, + "id": "zenmux/x-ai/grok-4.1-fast", + "name": "Grok 4.1 Fast", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-04", - "release_date": "2025-12-10", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.75, - "output": 3.2, - "cache_read": 0.375 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 256000, + "context": 2000000, "output": 64000 } }, { - "id": "venice/llama-3.2-3b", - "name": "Llama 3.2 3B", - "family": "llama", - "attachment": false, + "id": "zenmux/x-ai/grok-4.1-fast-non", + "name": "Grok 4.1 Fast Non Reasoning", + "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2024-10-03", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "limit": { - "context": 128000, - "output": 32000 + "context": 2000000, + "output": 64000 } }, { - "id": "venice/llama-3.3-70b", - "name": "Llama 3.3 70B", - "family": "llama", + "id": "zenmux/x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-12", - "release_date": "2025-04-06", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "modalities": { "input": [ "text" @@ -15353,26 +85715,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.7, - "output": 2.8 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 }, "limit": { - "context": 128000, - "output": 32000 + "context": 256000, + "output": 64000 } }, { - "id": "venice/minimax-m21", - "name": "MiniMax M2.1", - "family": "minimax", + "id": "zenmux/xiaomi/mimo-v2-flash", + "name": "MiMo-V2-Flash", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-12-01", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ "text" @@ -15381,27 +85744,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.04 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "limit": { - "context": 198000, - "output": 49500 + "context": 262000, + "output": 64000 } }, { - "id": "venice/minimax-m25", - "name": "MiniMax M2.5", - "family": "minimax", + "id": "zenmux/xiaomi/mimo-v2-flash-free", + "name": "MiMo-V2-Flash Free", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-13", + "knowledge": "2025-01-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "modalities": { "input": [ "text" @@ -15412,56 +85775,53 @@ }, "open_weights": false, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.04 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 198000, - "output": 32000 + "context": 262000, + "output": 64000 } }, { - "id": "venice/mistral-31-24b", - "name": "Venice Medium", - "family": "mistral", - "attachment": true, - "reasoning": false, + "id": "zenmux/z-ai/glm-4.5", + "name": "GLM 4.5", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2025-03-18", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.5, - "output": 2.0 + "input": 0.35, + "output": 1.54, + "cache_read": 0.07 }, "limit": { "context": 128000, - "output": 32000 + "output": 64000 } }, { - "id": "venice/openai-gpt-52", - "name": "GPT-5.2", - "family": "gpt", + "id": "zenmux/z-ai/glm-4.5-air", + "name": "GLM 4.5 Air", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-08-31", - "release_date": "2025-12-13", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "modalities": { "input": [ "text" @@ -15472,30 +85832,28 @@ }, "open_weights": false, "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.11, + "output": 0.56, + "cache_read": 0.02 }, "limit": { - "context": 256000, + "context": 128000, "output": 64000 } }, { - "id": "venice/openai-gpt-52-codex", - "name": "GPT-5.2 Codex", - "family": "gpt-codex", - "attachment": true, + "id": "zenmux/z-ai/glm-4.6", + "name": "GLM 4.6", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-08", - "release_date": "2025-01-15", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -15503,113 +85861,117 @@ }, "open_weights": false, "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.35, + "output": 1.54, + "cache_read": 0.07 }, "limit": { - "context": 256000, + "context": 200000, "output": 64000 } }, { - "id": "venice/openai-gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "family": "gpt-oss", - "attachment": false, - "reasoning": false, + "id": "zenmux/z-ai/glm-4.6v", + "name": "GLM 4.6V", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-11-06", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.07, - "output": 0.3 + "input": 0.14, + "output": 0.42, + "cache_read": 0.03 }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 64000 } }, { - "id": "venice/qwen3-235b-a22b-instruct", - "name": "Qwen 3 235B A22B Instruct 2507", - "family": "qwen", - "attachment": false, - "reasoning": false, + "id": "zenmux/z-ai/glm-4.6v-flash", + "name": "GLM 4.6V FlashX", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.15, - "output": 0.75 + "input": 0.02, + "output": 0.21, + "cache_read": 0.0043 }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 64000 } }, { - "id": "venice/qwen3-235b-a22b-thinking", - "name": "Qwen 3 235B A22B Thinking 2507", - "family": "qwen", - "attachment": false, + "id": "zenmux/z-ai/glm-4.6v-flash-free", + "name": "GLM 4.6V Flash (Free)", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.45, - "output": 3.5 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 64000 } }, { - "id": "venice/qwen3-4b", - "name": "Venice Small", - "family": "qwen", + "id": "zenmux/z-ai/glm-4.7", + "name": "GLM 4.7", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-07", - "release_date": "2025-04-29", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "modalities": { "input": [ "text" @@ -15618,27 +85980,27 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.05, - "output": 0.15 + "input": 0.28, + "output": 1.14, + "cache_read": 0.06 }, "limit": { - "context": 32000, - "output": 8000 + "context": 200000, + "output": 64000 } }, { - "id": "venice/qwen3-coder-480b-a35b-instruct", - "name": "Qwen 3 Coder 480b", - "family": "qwen", + "id": "zenmux/z-ai/glm-4.7-flash-free", + "name": "GLM 4.7 Flash (Free)", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "modalities": { "input": [ "text" @@ -15647,27 +86009,26 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.75, - "output": 3.0 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 256000, + "context": 200000, "output": 64000 } }, { - "id": "venice/qwen3-next-80b", - "name": "Qwen 3 Next 80b", - "family": "qwen", + "id": "zenmux/z-ai/glm-4.7-flashx", + "name": "GLM 4.7 FlashX", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "modalities": { "input": [ "text" @@ -15676,56 +86037,57 @@ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.35, - "output": 1.9 + "input": 0.07, + "output": 0.42, + "cache_read": 0.01 }, "limit": { - "context": 256000, + "context": 200000, "output": 64000 } }, { - "id": "venice/qwen3-vl-235b-a22b", - "name": "Qwen3 VL 235B", - "family": "qwen", - "attachment": true, - "reasoning": false, + "id": "zenmux/z-ai/glm-5", + "name": "GLM 5", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2026-01-16", - "last_updated": "2026-01-28", + "knowledge": "2025-01-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": true, + "open_weights": false, "cost": { - "input": 0.25, - "output": 1.5 + "input": 0.58, + "output": 2.6, + "cache_read": 0.14 }, "limit": { - "context": 256000, - "output": 64000 + "context": 200000, + "output": 128000 } }, { - "id": "venice/venice-uncensored", - "name": "Venice Uncensored 1.1", - "family": "venice", + "id": "zhipuai-coding-plan/glm-4.5", + "name": "GLM-4.5", + "family": "glm", "attachment": false, - "reasoning": false, - "tool_call": false, + "reasoning": true, + "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2025-03-18", - "last_updated": "2026-01-28", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -15736,25 +86098,27 @@ }, "open_weights": true, "cost": { - "input": 0.2, - "output": 0.9 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 32000, - "output": 8000 + "context": 131072, + "output": 98304 } }, { - "id": "venice/zai-org-glm-4.7", - "name": "GLM 4.7", - "family": "glm", + "id": "zhipuai-coding-plan/glm-4.5-air", + "name": "GLM-4.5-Air", + "family": "glm-air", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2025-04", - "release_date": "2025-12-24", - "last_updated": "2026-01-28", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -15765,25 +86129,27 @@ }, "open_weights": true, "cost": { - "input": 0.55, - "output": 2.65, - "cache_read": 0.11 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 198000, - "output": 49500 + "context": 131072, + "output": 98304 } }, { - "id": "venice/zai-org-glm-4.7-flash", - "name": "GLM 4.7 Flash", + "id": "zhipuai-coding-plan/glm-4.5-flash", + "name": "GLM-4.5-Flash", "family": "glm-flash", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2026-01-29", - "last_updated": "2026-02-10", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -15794,27 +86160,32 @@ }, "open_weights": true, "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 128000, - "output": 32000 + "context": 131072, + "output": 98304 } }, { - "id": "venice/zai-org-glm-5", - "name": "GLM 5", + "id": "zhipuai-coding-plan/glm-4.5v", + "name": "GLM-4.5V", "family": "glm", - "attachment": false, + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -15822,26 +86193,25 @@ }, "open_weights": true, "cost": { - "input": 1.0, - "output": 3.2, - "cache_read": 0.2 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 198000, - "output": 49500 + "context": 64000, + "output": 16384 } }, { - "id": "x-ai/grok-2", - "name": "Grok 2 Latest", - "family": "grok", + "id": "zhipuai-coding-plan/glm-4.6", + "name": "GLM-4.6", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ "text" @@ -15850,89 +86220,91 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 10.0, - "cache_read": 2.0 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 } }, { - "id": "x-ai/grok-2-vision", - "name": "Grok 2 Vision Latest", - "family": "grok", + "id": "zhipuai-coding-plan/glm-4.6v", + "name": "GLM-4.6V", + "family": "glm", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 2.0, - "output": 10.0, - "cache_read": 2.0 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 32768 } }, { - "id": "x-ai/grok-3", - "name": "Grok 3 Latest", - "family": "grok", - "attachment": false, - "reasoning": false, + "id": "zhipuai-coding-plan/glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "family": "glm", + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75 + "input": 0.0, + "output": 0.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 } }, { - "id": "x-ai/grok-3-fast", - "name": "Grok 3 Fast", - "family": "grok", + "id": "zhipuai-coding-plan/glm-4.7", + "name": "GLM-4.7", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ "text" @@ -15941,28 +86313,28 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 5.0, - "output": 25.0, - "cache_read": 1.25 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 } }, { - "id": "x-ai/grok-3-mini", - "name": "Grok 3 Mini", - "family": "grok", + "id": "zhipuai-coding-plan/glm-5", + "name": "GLM-5", + "family": "glm", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "modalities": { "input": [ "text" @@ -15973,26 +86345,27 @@ }, "open_weights": false, "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 } }, { - "id": "x-ai/grok-3-mini-fast", - "name": "Grok 3 Mini Fast Latest", - "family": "grok", + "id": "zhipuai/glm-4.5", + "name": "GLM-4.5", + "family": "glm", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -16001,28 +86374,29 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { "input": 0.6, - "output": 4.0, - "cache_read": 0.15 + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0.0 }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 } }, { - "id": "x-ai/grok-4", - "name": "Grok 4", - "family": "grok", + "id": "zhipuai/glm-4.5-air", + "name": "GLM-4.5-Air", + "family": "glm-air", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ "text" @@ -16031,152 +86405,153 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 3.0, - "output": 15.0, - "cache_read": 0.75 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0.0 }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 98304 } }, { - "id": "x-ai/grok-4-fast", - "name": "Grok 4 Fast", - "family": "grok", - "attachment": true, + "id": "zhipuai/glm-4.5-flash", + "name": "GLM-4.5-Flash", + "family": "glm-flash", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 98304 } }, { - "id": "x-ai/grok-4-fast-non", - "name": "Grok 4 Fast (Non-Reasoning)", - "family": "grok", + "id": "zhipuai/glm-4.5v", + "name": "GLM-4.5V", + "family": "glm", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.6, + "output": 1.8 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 64000, + "output": 16384 } }, { - "id": "x-ai/grok-4.1-fast", - "name": "Grok 4.1 Fast", - "family": "grok", - "attachment": true, + "id": "zhipuai/glm-4.6", + "name": "GLM-4.6", + "family": "glm", + "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0.0 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 204800, + "output": 131072 } }, { - "id": "x-ai/grok-4.1-fast-non", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "family": "grok", + "id": "zhipuai/glm-4.6v", + "name": "GLM-4.6V", + "family": "glm", "attachment": true, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.3, + "output": 0.9 }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 32768 } }, { - "id": "x-ai/grok-beta", - "name": "Grok Beta", - "family": "grok-beta", + "id": "zhipuai/glm-4.7", + "name": "GLM-4.7", + "family": "glm", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "modalities": { "input": [ "text" @@ -16185,28 +86560,29 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 5.0, - "output": 15.0, - "cache_read": 5.0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0.0 }, "limit": { - "context": 131072, - "output": 4096 + "context": 204800, + "output": 131072 } }, { - "id": "x-ai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "family": "grok", + "id": "zhipuai/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "family": "glm-flash", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "modalities": { "input": [ "text" @@ -16215,32 +86591,31 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.0, + "output": 0.0, + "cache_read": 0.0, + "cache_write": 0.0 }, "limit": { - "context": 256000, - "output": 10000 + "context": 200000, + "output": 131072 } }, { - "id": "x-ai/grok-vision-beta", - "name": "Grok Vision Beta", - "family": "grok-vision", - "attachment": true, - "reasoning": false, + "id": "zhipuai/glm-5", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -16248,13 +86623,14 @@ }, "open_weights": false, "cost": { - "input": 5.0, - "output": 15.0, - "cache_read": 5.0 + "input": 1.0, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0.0 }, "limit": { - "context": 8192, - "output": 4096 + "context": 204800, + "output": 131072 } } ] \ No newline at end of file diff --git a/crates/goose/src/recipe/build_recipe/mod.rs b/crates/goose/src/recipe/build_recipe/mod.rs index 7c7e91518bcc..ddd7be58de49 100644 --- a/crates/goose/src/recipe/build_recipe/mod.rs +++ b/crates/goose/src/recipe/build_recipe/mod.rs @@ -153,7 +153,7 @@ where Ok((param_map, missing_params)) } -fn resolve_sub_recipe_path( +pub fn resolve_sub_recipe_path( sub_recipe_path: &str, parent_recipe_dir: &Path, ) -> Result { diff --git a/crates/goose/tests/providers.rs b/crates/goose/tests/providers.rs index 68e81de4bccc..6efb78d083aa 100644 --- a/crates/goose/tests/providers.rs +++ b/crates/goose/tests/providers.rs @@ -119,7 +119,10 @@ impl ProviderTester { .await .expect("get_prefixed_tools failed"); - let info = self.extension_manager.get_extensions_info().await; + let info = self + .extension_manager + .get_extensions_info(std::path::Path::new(".")) + .await; let system = PromptManager::new() .builder() .with_extensions(info.into_iter()) diff --git a/ui/desktop/openapi.json b/ui/desktop/openapi.json index 7ec30838f87f..d6c5b7e4da75 100644 --- a/ui/desktop/openapi.json +++ b/ui/desktop/openapi.json @@ -10,7 +10,7 @@ "license": { "name": "Apache-2.0" }, - "version": "1.24.0" + "version": "1.25.0" }, "paths": { "/action-required/tool-confirmation": { diff --git a/ui/desktop/package-lock.json b/ui/desktop/package-lock.json index 50127d4567ac..3394f8a20c7e 100644 --- a/ui/desktop/package-lock.json +++ b/ui/desktop/package-lock.json @@ -1,12 +1,12 @@ { "name": "goose-app", - "version": "1.24.0", + "version": "1.25.0", "lockfileVersion": 3, "requires": true, "packages": { "": { "name": "goose-app", - "version": "1.24.0", + "version": "1.25.0", "license": "Apache-2.0", "dependencies": { "@mcp-ui/client": "^6.1.0", diff --git a/ui/desktop/package.json b/ui/desktop/package.json index 78b2f52914bf..4c4e10f77190 100644 --- a/ui/desktop/package.json +++ b/ui/desktop/package.json @@ -1,7 +1,7 @@ { "name": "goose-app", "productName": "Goose", - "version": "1.24.0", + "version": "1.25.0", "description": "Goose App", "engines": { "node": "^24.10.0", diff --git a/ui/desktop/src/components/bottom_menu/BottomMenuExtensionSelection.tsx b/ui/desktop/src/components/bottom_menu/BottomMenuExtensionSelection.tsx index 468121086f61..221baab1a9ac 100644 --- a/ui/desktop/src/components/bottom_menu/BottomMenuExtensionSelection.tsx +++ b/ui/desktop/src/components/bottom_menu/BottomMenuExtensionSelection.tsx @@ -33,6 +33,11 @@ export const BottomMenuExtensionSelection = ({ sessionId }: BottomMenuExtensionS const { extensionsList: allExtensions } = useConfig(); const isHubView = !sessionId; + useEffect(() => { + setIsSessionExtensionsLoaded(false); + setSessionExtensions([]); + }, [sessionId]); + useEffect(() => { const handleExtensionsLoaded = () => { setRefreshTrigger((prev) => prev + 1); @@ -53,8 +58,11 @@ export const BottomMenuExtensionSelection = ({ sessionId }: BottomMenuExtensionS }; }, []); - // Fetch session-specific extensions or use global defaults useEffect(() => { + if (refreshTrigger === 0 && !isOpen) { + return; + } + const fetchExtensions = async () => { if (!sessionId) { return; @@ -75,7 +83,6 @@ export const BottomMenuExtensionSelection = ({ sessionId }: BottomMenuExtensionS } }; - setIsSessionExtensionsLoaded(false); fetchExtensions(); }, [sessionId, isOpen, refreshTrigger]); diff --git a/ui/desktop/src/hooks/useChatStream.ts b/ui/desktop/src/hooks/useChatStream.ts index aa0d1497b68a..ef78641c7736 100644 --- a/ui/desktop/src/hooks/useChatStream.ts +++ b/ui/desktop/src/hooks/useChatStream.ts @@ -433,6 +433,7 @@ export function useChatStream({ }, }, }); + window.dispatchEvent(new CustomEvent(AppEvents.SESSION_EXTENSIONS_LOADED)); onSessionLoaded?.(); return; } diff --git a/ui/desktop/src/platform/windows/bin/install-node.cmd b/ui/desktop/src/platform/windows/bin/install-node.cmd deleted file mode 100644 index 26abe9b09b03..000000000000 --- a/ui/desktop/src/platform/windows/bin/install-node.cmd +++ /dev/null @@ -1,37 +0,0 @@ -@echo off -setlocal enabledelayedexpansion - -REM Check if Node.js is installed in Program Files -if exist "C:\Program Files\nodejs\node.exe" ( - echo Node.js found in Program Files - set "NODE_EXE=C:\Program Files\nodejs\node.exe" - goto :found -) - -REM Check if Node.js is installed in Program Files (x86) -if exist "C:\Program Files (x86)\nodejs\node.exe" ( - echo "Node.js found in Program Files (x86)" - set "NODE_EXE=C:\Program Files (x86)\nodejs\node.exe" - goto :found -) - -echo Node.js not found in standard locations, installing... - -REM Download Node.js MSI installer -powershell -Command "& {[Net.ServicePointManager]::SecurityProtocol = [Net.SecurityProtocolType]::Tls12; Invoke-WebRequest -Uri '%1' -OutFile '%TEMP%\node-setup.msi'}" - -REM Install Node.js silently -msiexec /i "%TEMP%\node-setup.msi" /qn - -REM Wait a bit for installation to complete -timeout /t 5 /nobreak - -REM Clean up -del "%TEMP%\node-setup.msi" - -REM Set path to installed Node.js -set "NODE_EXE=C:\Program Files\nodejs\node.exe" - -:found -echo Using Node.js: %NODE_EXE% -exit /b 0 diff --git a/ui/desktop/src/platform/windows/bin/npx.cmd b/ui/desktop/src/platform/windows/bin/npx.cmd index 7c019e5ffe82..c297b146671d 100644 --- a/ui/desktop/src/platform/windows/bin/npx.cmd +++ b/ui/desktop/src/platform/windows/bin/npx.cmd @@ -1,31 +1,45 @@ @ECHO OFF SETLOCAL EnableDelayedExpansion -SET "SCRIPT_DIR=%~dp0" +SET "NODE_VERSION=22.14.0" +SET "GOOSE_NODE_DIR=%LOCALAPPDATA%\Goose\node" -REM Try to find Node.js in standard locations first -if exist "C:\Program Files\nodejs\npx.cmd" ( - "C:\Program Files\nodejs\npx.cmd" %* - exit /b %errorlevel% +REM === Check for previously downloaded portable Node.js (matching version) === +if exist "%GOOSE_NODE_DIR%\node-v%NODE_VERSION%.installed" ( + SET "PATH=%GOOSE_NODE_DIR%;!PATH!" + "%GOOSE_NODE_DIR%\npx.cmd" %* + exit /b !errorlevel! ) -if exist "C:\Program Files (x86)\nodejs\npx.cmd" ( - "C:\Program Files (x86)\nodejs\npx.cmd" %* - exit /b %errorlevel% -) +REM === Download portable Node.js === +echo [Goose] Node.js not found. Downloading portable Node.js v%NODE_VERSION%... 1>&2 + +SET "NODE_ZIP=%TEMP%\goose-node-%NODE_VERSION%.zip" +SET "NODE_EXTRACT=%TEMP%\goose-node-extract" -REM If Node.js not found, run installer -call "%SCRIPT_DIR%install-node.cmd" "https://nodejs.org/dist/v23.10.0/node-v23.10.0-x64.msi" +powershell -NoProfile -Command "$ProgressPreference='SilentlyContinue'; try { [Net.ServicePointManager]::SecurityProtocol=[Net.SecurityProtocolType]::Tls12; Invoke-WebRequest -Uri 'https://nodejs.org/dist/v%NODE_VERSION%/node-v%NODE_VERSION%-win-x64.zip' -OutFile '%NODE_ZIP%' -UseBasicParsing; Expand-Archive -Path '%NODE_ZIP%' -DestinationPath '%NODE_EXTRACT%' -Force; exit 0 } catch { Write-Error $_.Exception.Message; exit 1 }" if errorlevel 1 ( - echo Failed to install Node.js + echo [Goose] ERROR: Failed to download Node.js. Please install manually from https://nodejs.org/ 1>&2 + del "%NODE_ZIP%" >nul 2>&1 exit /b 1 ) -REM Try using the newly installed Node.js -if exist "C:\Program Files\nodejs\npx.cmd" ( - "C:\Program Files\nodejs\npx.cmd" %* - exit /b %errorlevel% +REM Clean previous version and install to Goose directory +rmdir /s /q "%GOOSE_NODE_DIR%" >nul 2>&1 +mkdir "%GOOSE_NODE_DIR%" >nul 2>&1 +xcopy /s /e /q /y "%NODE_EXTRACT%\node-v%NODE_VERSION%-win-x64\*" "%GOOSE_NODE_DIR%\" >nul 2>&1 + +REM Clean up +del "%NODE_ZIP%" >nul 2>&1 +rmdir /s /q "%NODE_EXTRACT%" >nul 2>&1 + +if exist "%GOOSE_NODE_DIR%\npx.cmd" ( + echo.>"%GOOSE_NODE_DIR%\node-v%NODE_VERSION%.installed" + SET "PATH=%GOOSE_NODE_DIR%;!PATH!" + echo [Goose] Node.js v%NODE_VERSION% ready. 1>&2 + "%GOOSE_NODE_DIR%\npx.cmd" %* + exit /b !errorlevel! ) -echo Failed to find npx after Node.js installation +echo [Goose] ERROR: Installation failed. Please install Node.js manually from https://nodejs.org/ 1>&2 exit /b 1 diff --git a/ui/desktop/src/utils/winShims.ts b/ui/desktop/src/utils/winShims.ts index 058591724a16..7b8170dadd21 100644 --- a/ui/desktop/src/utils/winShims.ts +++ b/ui/desktop/src/utils/winShims.ts @@ -21,7 +21,7 @@ export async function ensureWinShims(): Promise { await fs.promises.mkdir(tgtDir, { recursive: true }); // Copy command-line tools, NOT goosed.exe (which should always be used locally) - const shims = ['uvx.exe', 'uv.exe', 'npx.cmd', 'install-node.cmd']; + const shims = ['uvx.exe', 'uv.exe', 'npx.cmd']; await Promise.all( shims.map(async (shim) => {