{ "*/1-month-commitment/cohere.command-light-text-v14" : {"mode": "chat", "provider": "bedrock", "base_model": "command-light-text-v14", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.001902, "output_cost_per_second": 0.001902}, "*/1-month-commitment/cohere.command-text-v14" : {"mode": "chat", "provider": "bedrock", "base_model": "command-text-v14", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.011, "output_cost_per_second": 0.011}, "*/6-month-commitment/cohere.command-light-text-v14" : {"mode": "chat", "provider": "bedrock", "base_model": "command-light-text-v14", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.0011416, "output_cost_per_second": 0.0011416}, "*/6-month-commitment/cohere.command-text-v14" : {"mode": "chat", "provider": "bedrock", "base_model": "command-text-v14", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.0066027, "output_cost_per_second": 0.0066027}, "1024-x-1024/dall-e-3" : {"mode": "image_generation", "provider": "openai", "base_model": "dall-e-3", "input_cost_per_pixel": 0.0000000381469, "output_cost_per_pixel": 0}, "1024-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1", "input_cost_per_image": 0.042, "input_cost_per_pixel": 0.000000040054321, "output_cost_per_pixel": 0}, "1024-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1-mini", "input_cost_per_image": 0.011}, "1024-x-1024/gpt-image-1.5" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.034}, "1024-x-1024/gpt-image-1.5-2025-12-16" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.009}, "1024-x-1536/gpt-image-1" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1", "input_cost_per_image": 0.25, "input_cost_per_pixel": 0.000000158945719, "output_cost_per_pixel": 0}, "1024-x-1536/gpt-image-1-mini" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1-mini", "input_cost_per_image": 0.015}, "1024-x-1536/gpt-image-1.5" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.013}, "1024-x-1536/gpt-image-1.5-2025-12-16" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.05}, "1024-x-1792/dall-e-3" : {"mode": "image_generation", "provider": "openai", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000006539, "output_cost_per_pixel": 0}, "1536-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1", "input_cost_per_image": 0.063, "input_cost_per_pixel": 0.000000040054321, "output_cost_per_pixel": 0}, "1536-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1-mini", "input_cost_per_image": 0.015}, "1536-x-1024/gpt-image-1.5" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.013}, "1536-x-1024/gpt-image-1.5-2025-12-16" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.2}, "1792-x-1024/dall-e-3" : {"mode": "image_generation", "provider": "openai", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000006539, "output_cost_per_pixel": 0}, "50-steps/bedrock/amazon.nova-canvas-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "nova-canvas", "max_input_tokens": 2600, "output_cost_per_image": 0.06}, "50-steps/stability.stable-diffusion-xl-v0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-diffusion-xl-v0", "max_input_tokens": 77, "output_cost_per_image": 0.018}, "50-steps/stability.stable-diffusion-xl-v1" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-diffusion-xl-v1", "max_input_tokens": 77, "output_cost_per_image": 0.04}, "@cf/meta/llama-2-7b-chat-fp16" : {"mode": "chat", "provider": "cloudflare", "max_input_tokens": 3072, "max_output_tokens": 3072, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923}, "@cf/meta/llama-2-7b-chat-int8" : {"mode": "chat", "provider": "cloudflare", "max_input_tokens": 2048, "max_output_tokens": 2048, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923}, "@cf/mistral/mistral-7b-instruct-v0.1" : {"mode": "chat", "provider": "cloudflare", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923}, "@hf/thebloke/codellama-7b-instruct-awq" : {"mode": "chat", "provider": "cloudflare", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923}, "BAAI/bge-base-en-v1.5" : {"mode": "embedding", "provider": "together_ai", "base_model": "bge-base-en", "max_input_tokens": 512, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "BAAI/bge-en-icl" : {"mode": "embedding", "provider": "nebius", "base_model": "bge-en-icl", "max_input_tokens": 32768, "input_cost_per_token": 0.00000001, "output_cost_per_token": 0}, "BAAI/bge-multilingual-gemma2" : {"mode": "embedding", "provider": "nebius", "base_model": "bge-multilingual-gemma2", "max_input_tokens": 8192, "input_cost_per_token": 0.00000001, "output_cost_per_token": 0}, "BSC-LT/ALIA-40b-instruct_Q8_0" : {"mode": "chat", "provider": "publicai", "base_model": "alia-40b-instruct-q8-0", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "BSC-LT/salamandra-7b-instruct-tools-16k" : {"mode": "chat", "provider": "publicai", "base_model": "salamandra-7b-instruct-tools-16k", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "Cohere-embed-v3-english" : {"mode": "embedding", "provider": "azure", "base_model": "embed-v3-english", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "Cohere-embed-v3-multilingual" : {"mode": "embedding", "provider": "azure", "base_model": "embed-v3-multilingual", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "DeepSeek-R1" : {"mode": "chat", "provider": "sambanova", "base_model": "deepseek-r1", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000007}, "DeepSeek-R1-Distill-Llama-70B" : {"mode": "chat", "provider": "ovhcloud", "base_model": "deepseek-r1-distill-llama-70b", "max_input_tokens": 131000, "max_output_tokens": 131000, "input_cost_per_token": 0.00000067, "output_cost_per_token": 0.00000067}, "DeepSeek-V3-0324" : {"mode": "chat", "provider": "sambanova", "base_model": "deepseek-v3", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.0000045}, "DeepSeek-V3.1" : {"mode": "chat", "provider": "sambanova", "base_model": "deepseek-v3.1", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.0000045}, "Embeddings" : {"mode": "embedding", "provider": "gigachat", "base_model": "embeddings", "max_input_tokens": 512, "input_cost_per_token": 0, "output_cost_per_token": 0}, "Embeddings-2" : {"mode": "embedding", "provider": "gigachat", "base_model": "embeddings-2", "max_input_tokens": 512, "input_cost_per_token": 0, "output_cost_per_token": 0}, "EmbeddingsGigaR" : {"mode": "embedding", "provider": "gigachat", "base_model": "embeddingsgigar", "max_input_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "FLUX-1.1-pro" : {"mode": "image_generation", "provider": "azure", "base_model": "flux-1.1-pro", "output_cost_per_image": 0.04}, "FLUX.1-Kontext-pro" : {"mode": "image_generation", "provider": "azure", "base_model": "flux.1-kontext-pro", "output_cost_per_image": 0.04}, "Gemma-3-4b-it-GGUF" : {"mode": "chat", "provider": "lemonade", "base_model": "gemma-3-4b-it", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "GigaChat-2-Lite" : {"mode": "chat", "provider": "gigachat", "base_model": "gigachat-2-lite", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "GigaChat-2-Max" : {"mode": "chat", "provider": "gigachat", "base_model": "gigachat-2-max", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "GigaChat-2-Pro" : {"mode": "chat", "provider": "gigachat", "base_model": "gigachat-2-pro", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "Gryphe/MythoMax-L2-13b" : {"mode": "chat", "provider": "deepinfra", "base_model": "mythomax-l2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000009}, "HuggingFaceH4/zephyr-7b-beta" : {"mode": "chat", "provider": "anyscale", "base_model": "zephyr-7b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "Llama-3.1-8B-Instruct" : {"mode": "chat", "provider": "ovhcloud", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 131000, "max_output_tokens": 131000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "Llama-3.2-11B-Vision-Instruct" : {"mode": "chat", "provider": "azure", "base_model": "llama-3.2-11b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000037, "output_cost_per_token": 0.00000037}, "Llama-3.2-90B-Vision-Instruct" : {"mode": "chat", "provider": "azure", "base_model": "llama-3.2-90b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000204, "output_cost_per_token": 0.00000204}, "Llama-3.3-70B-Instruct" : {"mode": "chat", "provider": "meta_llama", "base_model": "llama-3.3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4028}, "Llama-3.3-8B-Instruct" : {"mode": "chat", "provider": "meta_llama", "base_model": "llama-3.3-8b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4028}, "Llama-4-Maverick-17B-128E-Instruct" : {"mode": "chat", "provider": "sambanova", "base_model": "llama-4-maverick-17b-128e-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000063, "output_cost_per_token": 0.0000018}, "Llama-4-Maverick-17B-128E-Instruct-FP8" : {"mode": "chat", "provider": "azure", "base_model": "llama-4-maverick-17b-128e-instruct-fp8", "max_input_tokens": 1000000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000141, "output_cost_per_token": 0.00000035}, "Llama-4-Scout-17B-16E-Instruct" : {"mode": "chat", "provider": "azure", "base_model": "llama-4-scout-17b-16e-instruct", "max_input_tokens": 10000000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000078}, "Llama-4-Scout-17B-16E-Instruct-FP8" : {"mode": "chat", "provider": "meta_llama", "base_model": "llama-4-scout-17b-16e-instruct-fp8", "max_input_tokens": 10000000, "max_output_tokens": 4028}, "MAI-DS-R1" : {"mode": "chat", "provider": "azure", "base_model": "mai-ds-r1", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000135, "output_cost_per_token": 0.0000054}, "Meta-Llama-3-70B-Instruct" : {"mode": "chat", "provider": "azure", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.00000037}, "Meta-Llama-3.1-405B-Instruct" : {"mode": "chat", "provider": "azure", "base_model": "llama-3.1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000533, "output_cost_per_token": 0.000016}, "Meta-Llama-3.1-70B-Instruct" : {"mode": "chat", "provider": "azure", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000268, "output_cost_per_token": 0.00000354}, "Meta-Llama-3.1-8B-Instruct" : {"mode": "chat", "provider": "sambanova", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002}, "Meta-Llama-3.2-1B-Instruct" : {"mode": "chat", "provider": "sambanova", "base_model": "llama-3.2-1b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000008}, "Meta-Llama-3.2-3B-Instruct" : {"mode": "chat", "provider": "sambanova", "base_model": "llama-3.2-3b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000016}, "Meta-Llama-3.3-70B-Instruct" : {"mode": "chat", "provider": "sambanova", "base_model": "llama-3.3-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000012}, "Meta-Llama-3_1-70B-Instruct" : {"mode": "chat", "provider": "ovhcloud", "base_model": "llama-3-1-70b-instruct", "max_input_tokens": 131000, "max_output_tokens": 131000, "input_cost_per_token": 0.00000067, "output_cost_per_token": 0.00000067}, "Meta-Llama-3_3-70B-Instruct" : {"mode": "chat", "provider": "ovhcloud", "base_model": "llama-3-3-70b-instruct", "max_input_tokens": 131000, "max_output_tokens": 131000, "input_cost_per_token": 0.00000067, "output_cost_per_token": 0.00000067}, "Meta-Llama-Guard-3-8B" : {"mode": "chat", "provider": "sambanova", "base_model": "llama-guard-3-8b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003}, "MiniMax-M2" : {"mode": "chat", "provider": "minimax", "base_model": "minimax-m2", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "MiniMax-M2.1" : {"mode": "chat", "provider": "minimax", "base_model": "minimax-m2.1", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "MiniMax-M2.1-lightning" : {"mode": "chat", "provider": "minimax", "base_model": "minimax-m2.1-lightning", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000024, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "MiniMax-M2.5" : {"mode": "chat", "provider": "minimax", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "MiniMax-M2.5-lightning" : {"mode": "chat", "provider": "minimax", "base_model": "minimax-m2.5-lightning", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000024, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "MiniMax-M2.7" : {"mode": "chat", "provider": "sambanova", "base_model": "minimax-m2.7", "max_input_tokens": 204800, "max_output_tokens": 131072, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "MiniMaxAI/MiniMax-M2.1" : {"mode": "chat", "provider": "gmi", "base_model": "minimax-m2.1", "max_input_tokens": 196608, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "MiniMaxAI/MiniMax-M2.5" : {"mode": "chat", "provider": "wandb", "base_model": "minimax-m2.5", "max_input_tokens": 197000, "max_output_tokens": 197000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "Mistral-7B-Instruct-v0.3" : {"mode": "chat", "provider": "ovhcloud", "base_model": "mistral-7b-instruct", "max_input_tokens": 127000, "max_output_tokens": 127000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "Mistral-Nemo-Instruct-2407" : {"mode": "chat", "provider": "ovhcloud", "base_model": "mistral-nemo-instruct", "max_input_tokens": 118000, "max_output_tokens": 118000, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013}, "Mistral-Small-3.2-24B-Instruct-2506" : {"mode": "chat", "provider": "ovhcloud", "base_model": "mistral-small-3.2-24b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000028}, "Mixtral-8x7B-Instruct-v0.1" : {"mode": "chat", "provider": "ovhcloud", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000063, "output_cost_per_token": 0.00000063}, "NousResearch/Hermes-3-Llama-3.1-405B" : {"mode": "chat", "provider": "deepinfra", "base_model": "hermes-3-llama-3.1-405b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "NousResearch/Hermes-3-Llama-3.1-70B" : {"mode": "chat", "provider": "hyperbolic", "base_model": "hermes-3-llama-3.1-70b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.0000003}, "Phi-3-medium-128k-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3-medium-128k-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000068}, "Phi-3-medium-4k-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3-medium-4k-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000068}, "Phi-3-mini-128k-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3-mini-128k-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052}, "Phi-3-mini-4k-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3-mini-4k-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052}, "Phi-3-small-128k-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3-small-128k-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "Phi-3-small-8k-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3-small-8k-instruct", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "Phi-3.5-MoE-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3.5-moe-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000016, "output_cost_per_token": 0.00000064}, "Phi-3.5-mini-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3.5-mini-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052}, "Phi-3.5-vision-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-3.5-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052}, "Phi-4" : {"mode": "chat", "provider": "azure", "base_model": "phi-4", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.0000005}, "Phi-4-mini-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-4-mini-instruct", "max_input_tokens": 131072, "max_output_tokens": 4096, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003}, "Phi-4-mini-reasoning" : {"mode": "chat", "provider": "azure", "base_model": "phi-4-mini", "max_input_tokens": 131072, "max_output_tokens": 4096, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000032}, "Phi-4-multimodal-instruct" : {"mode": "chat", "provider": "azure", "base_model": "phi-4-multimodal-instruct", "max_input_tokens": 131072, "max_output_tokens": 4096, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000032, "input_cost_per_audio_token": 0.000004}, "Phi-4-reasoning" : {"mode": "chat", "provider": "azure", "base_model": "phi-4", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.0000005}, "QwQ-32B" : {"mode": "chat", "provider": "sambanova", "base_model": "qwq-32b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.000001}, "Qwen/QwQ-32B" : {"mode": "chat", "provider": "hyperbolic", "base_model": "qwq-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "Qwen/Qwen2-VL-72B-Instruct" : {"mode": "chat", "provider": "nebius", "base_model": "qwen2-vl-72b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.0000004}, "Qwen/Qwen2-VL-7B-Instruct" : {"mode": "chat", "provider": "nebius", "base_model": "qwen2-vl-7b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0.00000006}, "Qwen/Qwen2.5-32B-Instruct" : {"mode": "chat", "provider": "nebius", "base_model": "qwen2.5-32b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.0000002}, "Qwen/Qwen2.5-72B-Instruct" : {"mode": "chat", "provider": "nebius", "base_model": "qwen2.5-72b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.0000004}, "Qwen/Qwen2.5-72B-Instruct-Turbo" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen2.5-72b-instruct-turbo"}, "Qwen/Qwen2.5-7B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen2.5-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.0000001}, "Qwen/Qwen2.5-7B-Instruct-Turbo" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen2.5-7b-instruct-turbo"}, "Qwen/Qwen2.5-Coder-32B-Instruct" : {"mode": "chat", "provider": "nscale", "base_model": "qwen2.5-coder-32b-instruct", "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.0000002}, "Qwen/Qwen2.5-Coder-3B-Instruct" : {"mode": "chat", "provider": "nscale", "base_model": "qwen2.5-coder-3b-instruct", "input_cost_per_token": 0.00000001, "output_cost_per_token": 0.00000003}, "Qwen/Qwen2.5-Coder-7B" : {"mode": "chat", "provider": "nebius", "base_model": "qwen2.5-coder-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000001, "output_cost_per_token": 0.00000003}, "Qwen/Qwen2.5-Coder-7B-Instruct" : {"mode": "chat", "provider": "nscale", "base_model": "qwen2.5-coder-7b-instruct", "input_cost_per_token": 0.00000001, "output_cost_per_token": 0.00000003}, "Qwen/Qwen2.5-VL-32B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen2.5-vl-32b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "Qwen/Qwen2.5-VL-72B-Instruct" : {"mode": "chat", "provider": "nebius", "base_model": "qwen2.5-vl-72b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.0000004}, "Qwen/Qwen3-14B" : {"mode": "chat", "provider": "nebius", "base_model": "qwen3-14b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000024}, "Qwen/Qwen3-235B-A22B" : {"mode": "chat", "provider": "nebius", "base_model": "qwen3-235b-a22b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "Qwen/Qwen3-235B-A22B-Instruct-2507" : {"mode": "chat", "provider": "wandb", "base_model": "qwen3-235b-a22b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.01, "output_cost_per_token": 0.01}, "Qwen/Qwen3-235B-A22B-Instruct-2507-tput" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen3-235b-a22b-instruct", "max_input_tokens": 262000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.000006}, "Qwen/Qwen3-235B-A22B-Thinking-2507" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen3-235b-a22b-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000029}, "Qwen/Qwen3-235B-A22B-fp8-tput" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen3-235b-a22b-fp8", "max_input_tokens": 40000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "Qwen/Qwen3-30B-A3B" : {"mode": "chat", "provider": "nebius", "base_model": "qwen3-30b-a3b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "Qwen/Qwen3-32B" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen3-32b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.00000028}, "Qwen/Qwen3-4B" : {"mode": "chat", "provider": "nebius", "base_model": "qwen3-4b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000024}, "Qwen/Qwen3-Coder-480B-A35B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen3-coder-480b-a35b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016}, "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen3-coder-480b-a35b-instruct-fp8", "max_input_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen3-coder-480b-a35b-instruct-turbo", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000029, "output_cost_per_token": 0.0000012}, "Qwen/Qwen3-Next-80B-A3B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "qwen3-next-80b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.0000014}, "Qwen/Qwen3-Next-80B-A3B-Thinking" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen3-next-80b-a3b-thinking", "max_input_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000015}, "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8" : {"mode": "chat", "provider": "gmi", "base_model": "qwen3-vl-235b-a22b-instruct-fp8", "max_input_tokens": 262144, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000014}, "Qwen/Qwen3.5-397B-A17B" : {"mode": "chat", "provider": "together_ai", "base_model": "qwen3.5-397b-a17b", "max_input_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000036}, "Qwen2-Audio-7B-Instruct" : {"mode": "chat", "provider": "sambanova", "base_model": "qwen2-audio-7b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0001}, "Qwen2.5-Coder-32B-Instruct" : {"mode": "chat", "provider": "ovhcloud", "base_model": "qwen2.5-coder-32b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000087, "output_cost_per_token": 0.00000087}, "Qwen2.5-VL-72B-Instruct" : {"mode": "chat", "provider": "ovhcloud", "base_model": "qwen2.5-vl-72b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000091, "output_cost_per_token": 0.00000091}, "Qwen3-32B" : {"mode": "chat", "provider": "sambanova", "base_model": "qwen3-32b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000008}, "Qwen3-4B-Instruct-2507-GGUF" : {"mode": "chat", "provider": "lemonade", "base_model": "qwen3-4b-instruct", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "Qwen3-Coder-30B-A3B-Instruct-GGUF" : {"mode": "chat", "provider": "lemonade", "base_model": "qwen3-coder-30b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "Sao10K/L3-8B-Lunaris-v1-Turbo" : {"mode": "chat", "provider": "deepinfra", "base_model": "l3-8b-lunaris-v1-turbo", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000005}, "Sao10K/L3-8B-Stheno-v3.2" : {"mode": "chat", "provider": "novita", "base_model": "l3-8b-stheno", "max_input_tokens": 8192, "max_output_tokens": 32000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000005}, "Sao10K/L3.1-70B-Euryale-v2.2" : {"mode": "chat", "provider": "deepinfra", "base_model": "l3.1-70b-euryale", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000075}, "Sao10K/L3.3-70B-Euryale-v2.3" : {"mode": "chat", "provider": "deepinfra", "base_model": "l3.3-70b-euryale", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000075}, "WhereIsAI/UAE-Large-V1" : {"mode": "embedding", "provider": "fireworks", "base_model": "uae-large-v1", "max_input_tokens": 512, "input_cost_per_token": 0.000000016, "output_cost_per_token": 0}, "accounts/fireworks/models/" : {"mode": "embedding", "provider": "fireworks", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "accounts/fireworks/models/SSD-1B" : {"mode": "image_generation", "provider": "fireworks", "base_model": "ssd-1b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000000013, "output_cost_per_token": 0.00000000013}, "accounts/fireworks/models/chronos-hermes-13b-v2" : {"mode": "chat", "provider": "fireworks", "base_model": "chronos-hermes-13b-v2", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-llama-13b" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-13b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-llama-13b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-13b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-llama-13b-python" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-13b-python", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-llama-34b" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-34b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/code-llama-34b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-34b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/code-llama-34b-python" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-34b-python", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/code-llama-70b" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/code-llama-70b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-70b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/code-llama-70b-python" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-70b-python", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/code-llama-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-7b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-llama-7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-7b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-llama-7b-python" : {"mode": "chat", "provider": "fireworks", "base_model": "codellama-7b-python", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/code-qwen-1p5-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "code-qwen-1.5-7b", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/codegemma-2b" : {"mode": "chat", "provider": "fireworks", "base_model": "codegemma-2b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/codegemma-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "codegemma-7b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/cogito-671b-v2-p1" : {"mode": "chat", "provider": "fireworks", "base_model": "cogito-671b-v2-p1", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/cogito-v1-preview-llama-3b" : {"mode": "chat", "provider": "fireworks", "base_model": "cogito-v1-llama-3b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/cogito-v1-preview-llama-70b" : {"mode": "chat", "provider": "fireworks", "base_model": "cogito-v1-llama-70b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/cogito-v1-preview-llama-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "cogito-v1-llama-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/cogito-v1-preview-qwen-14b" : {"mode": "chat", "provider": "fireworks", "base_model": "cogito-v1-qwen-14b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/cogito-v1-preview-qwen-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "cogito-v1-qwen-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/dbrx-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "dbrx-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/deepseek-coder-1b-base" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-1b-base", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/deepseek-coder-33b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-33b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/deepseek-coder-7b-base" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-7b-base", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-coder-7b-base-v1p5" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-7b-base-v1.5", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-coder-7b-instruct-v1p5" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-7b-instruct-v1.5", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-coder-v2-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-v2-instruct", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/deepseek-coder-v2-lite-base" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-v2-lite-base", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/deepseek-coder-v2-lite-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-coder-v2-lite-instruct", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/deepseek-prover-v2" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-prover-v2", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/deepseek-r1" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1", "max_input_tokens": 128000, "max_output_tokens": 20480, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000008}, "accounts/fireworks/models/deepseek-r1-0528" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1", "max_input_tokens": 160000, "max_output_tokens": 160000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000008}, "accounts/fireworks/models/deepseek-r1-0528-distill-qwen3-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-0528-distill-qwen3-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-r1-basic" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-basic", "max_input_tokens": 128000, "max_output_tokens": 20480, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.00000219}, "accounts/fireworks/models/deepseek-r1-distill-llama-70b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-distill-llama-70b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/deepseek-r1-distill-llama-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-distill-llama-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-r1-distill-qwen-14b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-distill-qwen-14b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-r1-distill-qwen-1p5b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-distill-qwen-1.5b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/deepseek-r1-distill-qwen-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-distill-qwen-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/deepseek-r1-distill-qwen-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-r1-distill-qwen-7b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/deepseek-v2-lite-chat" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v2-lite-chat", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/deepseek-v2p5" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v2.5", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/deepseek-v3" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v3", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/deepseek-v3-0324" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v3", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/deepseek-v3p1" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v3.1", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000056, "output_cost_per_token": 0.00000168}, "accounts/fireworks/models/deepseek-v3p1-terminus" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v3.1-terminus", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000056, "output_cost_per_token": 0.00000168}, "accounts/fireworks/models/deepseek-v3p2" : {"mode": "chat", "provider": "fireworks", "base_model": "deepseek-v3.2", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000056, "output_cost_per_token": 0.00000168}, "accounts/fireworks/models/devstral-small-2505" : {"mode": "chat", "provider": "fireworks", "base_model": "devstral-small", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/dobby-mini-unhinged-plus-llama-3-1-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "dobby-mini-unhinged-plus-llama-3-1-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/dobby-unhinged-llama-3-3-70b-new" : {"mode": "chat", "provider": "fireworks", "base_model": "dobby-unhinged-llama-3-3-70b-new", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/dolphin-2-9-2-qwen2-72b" : {"mode": "chat", "provider": "fireworks", "base_model": "dolphin-2-9-2-qwen2-72b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/dolphin-2p6-mixtral-8x7b" : {"mode": "chat", "provider": "fireworks", "base_model": "dolphin-2.6-mixtral-8x7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/ernie-4p5-21b-a3b-pt" : {"mode": "chat", "provider": "fireworks", "base_model": "ernie-4.5-21b-a3b-pt", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/ernie-4p5-300b-a47b-pt" : {"mode": "chat", "provider": "fireworks", "base_model": "ernie-4.5-300b-a47b-pt", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/fare-20b" : {"mode": "chat", "provider": "fireworks", "base_model": "fare-20b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/firefunction-v1" : {"mode": "chat", "provider": "fireworks", "base_model": "firefunction-v1", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/firefunction-v2" : {"mode": "chat", "provider": "fireworks", "base_model": "firefunction-v2", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/firellava-13b" : {"mode": "chat", "provider": "fireworks", "base_model": "firellava-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/firesearch-ocr-v6" : {"mode": "chat", "provider": "fireworks", "base_model": "firesearch-ocr-v6", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/fireworks-asr-large" : {"mode": "audio_transcription", "provider": "fireworks", "base_model": "fireworks-asr-large", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/fireworks-asr-v2" : {"mode": "audio_transcription", "provider": "fireworks", "base_model": "fireworks-asr-v2", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/flux-1-dev" : {"mode": "chat", "provider": "fireworks", "base_model": "flux-1-dev", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/flux-1-dev-controlnet-union" : {"mode": "chat", "provider": "fireworks", "base_model": "flux-1-dev-controlnet-union", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000000001, "output_cost_per_token": 0.000000001}, "accounts/fireworks/models/flux-1-dev-fp8" : {"mode": "image_generation", "provider": "fireworks", "base_model": "flux-1-dev-fp8", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000000005, "output_cost_per_token": 0.0000000005}, "accounts/fireworks/models/flux-1-schnell" : {"mode": "chat", "provider": "fireworks", "base_model": "flux-1-schnell", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/flux-1-schnell-fp8" : {"mode": "image_generation", "provider": "fireworks", "base_model": "flux-1-schnell-fp8", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000000035, "output_cost_per_token": 0.00000000035}, "accounts/fireworks/models/flux-kontext-max" : {"mode": "image_generation", "provider": "fireworks", "base_model": "flux-kontext-max", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000008}, "accounts/fireworks/models/flux-kontext-pro" : {"mode": "image_generation", "provider": "fireworks", "base_model": "flux-kontext-pro", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004}, "accounts/fireworks/models/gemma-2b-it" : {"mode": "chat", "provider": "fireworks", "base_model": "gemma-2b-it", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/gemma-3-27b-it" : {"mode": "chat", "provider": "fireworks", "base_model": "gemma-3-27b-it", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/gemma-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "gemma-7b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/gemma-7b-it" : {"mode": "chat", "provider": "fireworks", "base_model": "gemma-7b-it", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/gemma2-9b-it" : {"mode": "chat", "provider": "fireworks", "base_model": "gemma-2-9b-it", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/glm-4p5" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-4.5", "max_input_tokens": 128000, "max_output_tokens": 96000, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.00000219}, "accounts/fireworks/models/glm-4p5-air" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-4.5-air", "max_input_tokens": 128000, "max_output_tokens": 96000, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/glm-4p5v" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-4.5v", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/glm-4p6" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-4.6", "max_input_tokens": 202800, "max_output_tokens": 202800, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.00000219}, "accounts/fireworks/models/glm-4p7" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-4.7", "max_input_tokens": 202800, "max_output_tokens": 202800, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.0000003}, "accounts/fireworks/models/glm-5p1" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-5.1", "max_input_tokens": 202800, "max_output_tokens": 202800, "input_cost_per_token": 0.0000014, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000026}, "accounts/fireworks/models/gpt-oss-120b" : {"mode": "chat", "provider": "fireworks", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "accounts/fireworks/models/gpt-oss-20b" : {"mode": "chat", "provider": "fireworks", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/gpt-oss-safeguard-120b" : {"mode": "chat", "provider": "fireworks", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/gpt-oss-safeguard-20b" : {"mode": "chat", "provider": "fireworks", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/hermes-2-pro-mistral-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "hermes-2-pro-mistral-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/internvl3-38b" : {"mode": "chat", "provider": "fireworks", "base_model": "internvl3-38b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/internvl3-78b" : {"mode": "chat", "provider": "fireworks", "base_model": "internvl3-78b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/internvl3-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "internvl3-8b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/japanese-stable-diffusion-xl" : {"mode": "image_generation", "provider": "fireworks", "base_model": "japanese-stable-diffusion-xl", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000000013, "output_cost_per_token": 0.00000000013}, "accounts/fireworks/models/kat-coder" : {"mode": "chat", "provider": "fireworks", "base_model": "kat-coder", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/kat-dev-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "kat-dev-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/kat-dev-72b-exp" : {"mode": "chat", "provider": "fireworks", "base_model": "kat-dev-72b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/kimi-k2-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "kimi-k2-instruct", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "accounts/fireworks/models/kimi-k2-instruct-0905" : {"mode": "chat", "provider": "fireworks", "base_model": "kimi-k2-instruct", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "accounts/fireworks/models/kimi-k2-thinking" : {"mode": "chat", "provider": "fireworks", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "accounts/fireworks/models/kimi-k2p5" : {"mode": "chat", "provider": "fireworks", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.0000001}, "accounts/fireworks/models/llama-guard-2-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-guard-2-8b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-guard-3-1b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-guard-3-1b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-guard-3-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-guard-3-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v2-13b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v2-13b-chat" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-2-13b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v2-70b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-2-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v2-70b-chat" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-2-70b-chat", "max_input_tokens": 2048, "max_output_tokens": 2048, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama-v2-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-2-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v2-7b-chat" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-2-7b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v3-70b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama-v3-70b-instruct-hf" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama-v3-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3-8b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v3-8b-instruct-hf" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v3p1-405b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003}, "accounts/fireworks/models/llama-v3p1-405b-instruct-long" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.1-405b-instruct-long", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p1-70b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama-v3p1-70b-instruct-1b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.1-70b-instruct-1b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p1-8b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p1-nemotron-70b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.1-nemotron-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama-v3p2-11b-vision-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.2-11b-vision-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llama-v3p2-1b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.2-1b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p2-1b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.2-1b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p2-3b" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.2-3b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p2-3b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.2-3b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/llama-v3p2-90b-vision-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.2-90b-vision-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama-v3p3-70b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-3.3-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/llama4-maverick-instruct-basic" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-4-maverick-instruct-basic", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/llama4-scout-instruct-basic" : {"mode": "chat", "provider": "fireworks", "base_model": "llama-4-scout-instruct-basic", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "accounts/fireworks/models/llamaguard-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "llamaguard-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/llava-yi-34b" : {"mode": "chat", "provider": "fireworks", "base_model": "llava-yi-34b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/minimax-m1-80k" : {"mode": "chat", "provider": "fireworks", "base_model": "minimax-m1-80k", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/minimax-m2" : {"mode": "chat", "provider": "fireworks", "base_model": "minimax-m2", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/minimax-m2p1" : {"mode": "chat", "provider": "fireworks", "base_model": "minimax-m2.1", "max_input_tokens": 204800, "max_output_tokens": 204800, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000003}, "accounts/fireworks/models/ministral-3-14b-instruct-2512" : {"mode": "chat", "provider": "fireworks", "base_model": "ministral-3-14b-instruct", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/ministral-3-3b-instruct-2512" : {"mode": "chat", "provider": "fireworks", "base_model": "ministral-3-3b-instruct", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/ministral-3-8b-instruct-2512" : {"mode": "chat", "provider": "fireworks", "base_model": "ministral-3-8b-instruct", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-7b-instruct-4k" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-7b-instruct-4k", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-7b-instruct-v0p2" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-7b-instruct-v0.2", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-7b-instruct-v3" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-7b-instruct-v3", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-7b-v0p2" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-7b-v0.2", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-large-3-fp8" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-large-3-fp8", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/mistral-nemo-base-2407" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-nemo-base", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-nemo-instruct-2407" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-nemo-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/mistral-small-24b-instruct-2501" : {"mode": "chat", "provider": "fireworks", "base_model": "mistral-small-24b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/mixtral-8x22b" : {"mode": "chat", "provider": "fireworks", "base_model": "mixtral-8x22b", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/mixtral-8x22b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "mixtral-8x22b-instruct", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/mixtral-8x22b-instruct-hf" : {"mode": "chat", "provider": "fireworks", "base_model": "mixtral-8x22b-instruct", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "accounts/fireworks/models/mixtral-8x7b" : {"mode": "chat", "provider": "fireworks", "base_model": "mixtral-8x7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/mixtral-8x7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/mixtral-8x7b-instruct-hf" : {"mode": "chat", "provider": "fireworks", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/mythomax-l2-13b" : {"mode": "chat", "provider": "fireworks", "base_model": "mythomax-l2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/nemotron-nano-v2-12b-vl" : {"mode": "chat", "provider": "fireworks", "base_model": "nemotron-nano-v2-12b-vl", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/nous-capybara-7b-v1p9" : {"mode": "chat", "provider": "fireworks", "base_model": "nous-capybara-7b-v1.9", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/nous-hermes-2-mixtral-8x7b-dpo" : {"mode": "chat", "provider": "fireworks", "base_model": "nous-hermes-2-mixtral-8x7b-dpo", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/nous-hermes-2-yi-34b" : {"mode": "chat", "provider": "fireworks", "base_model": "nous-hermes-2-yi-34b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/nous-hermes-llama2-13b" : {"mode": "chat", "provider": "fireworks", "base_model": "nous-hermes-llama2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/nous-hermes-llama2-70b" : {"mode": "chat", "provider": "fireworks", "base_model": "nous-hermes-llama2-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/nous-hermes-llama2-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "nous-hermes-llama2-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/nvidia-nemotron-nano-12b-v2" : {"mode": "chat", "provider": "fireworks", "base_model": "nvidia-nemotron-nano-12b-v2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/nvidia-nemotron-nano-9b-v2" : {"mode": "chat", "provider": "fireworks", "base_model": "nvidia-nemotron-nano-9b-v2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/openchat-3p5-0106-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "openchat-3.5-0106-7b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/openhermes-2-mistral-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "openhermes-2-mistral-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/openhermes-2p5-mistral-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "openhermes-2.5-mistral-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/openorca-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "openorca-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/phi-2-3b" : {"mode": "chat", "provider": "fireworks", "base_model": "phi-2-3b", "max_input_tokens": 2048, "max_output_tokens": 2048, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/phi-3-mini-128k-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "phi-3-mini-128k-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/phi-3-vision-128k-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "phi-3-vision-128k-instruct", "max_input_tokens": 32064, "max_output_tokens": 32064, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/phind-code-llama-34b-python-v1" : {"mode": "chat", "provider": "fireworks", "base_model": "phind-code-llama-34b-python-v1", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/phind-code-llama-34b-v1" : {"mode": "chat", "provider": "fireworks", "base_model": "phind-code-llama-34b-v1", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/phind-code-llama-34b-v2" : {"mode": "chat", "provider": "fireworks", "base_model": "phind-code-llama-34b-v2", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/playground-v2-1024px-aesthetic" : {"mode": "image_generation", "provider": "fireworks", "base_model": "playground-v2-1024px-aesthetic", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000000013, "output_cost_per_token": 0.00000000013}, "accounts/fireworks/models/playground-v2-5-1024px-aesthetic" : {"mode": "image_generation", "provider": "fireworks", "base_model": "playground-v2-5-1024px-aesthetic", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000000013, "output_cost_per_token": 0.00000000013}, "accounts/fireworks/models/pythia-12b" : {"mode": "chat", "provider": "fireworks", "base_model": "pythia-12b", "max_input_tokens": 2048, "max_output_tokens": 2048, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen-qwq-32b-preview" : {"mode": "chat", "provider": "fireworks", "base_model": "qwq-32b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen-v2p5-14b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-14b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen-v2p5-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-7b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen1p5-72b-chat" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen1.5-72b-chat", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2-72b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2-72b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2-7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2-vl-2b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2-vl-2b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2-vl-72b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2-vl-72b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2-vl-7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2-vl-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-0p5b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-0.5b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-14b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-14b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-1p5b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-1.5b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-32b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-32b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-72b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-72b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-72b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-72b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-coder-0p5b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-0.5b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-coder-0p5b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-0.5b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-coder-14b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-14b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-coder-14b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-14b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-coder-1p5b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-1.5b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-coder-1p5b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-1.5b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-coder-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-32b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-coder-32b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-32b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-coder-32b-instruct-128k" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-32b-instruct-128k", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-coder-32b-instruct-32k-rope" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-32b-instruct-32k-rope", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-coder-32b-instruct-64k" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-32b-instruct-64k", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-coder-3b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-3b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-coder-3b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-3b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen2p5-coder-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-coder-7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-coder-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-math-72b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-math-72b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-vl-32b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-vl-32b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-vl-3b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-vl-3b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen2p5-vl-72b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-vl-72b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen2p5-vl-7b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen2.5-vl-7b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen3-0p6b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-0.6b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen3-14b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-14b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen3-1p7b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-1.7b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen3-1p7b-fp8-draft" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-1.7b-fp8-draft", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen3-1p7b-fp8-draft-131072" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-1.7b-fp8-draft-131072", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen3-1p7b-fp8-draft-40960" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-1.7b-fp8-draft-40960", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/qwen3-235b-a22b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-235b-a22b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/qwen3-235b-a22b-instruct-2507" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-235b-a22b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/qwen3-235b-a22b-thinking-2507" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-235b-a22b-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/qwen3-30b-a3b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-30b-a3b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "accounts/fireworks/models/qwen3-30b-a3b-instruct-2507" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-30b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "accounts/fireworks/models/qwen3-30b-a3b-thinking-2507" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-30b-a3b-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen3-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen3-4b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-4b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen3-4b-instruct-2507" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-4b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen3-8b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-8b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwen3-coder-30b-a3b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-coder-30b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-coder-480b-a35b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000018}, "accounts/fireworks/models/qwen3-coder-480b-instruct-bf16" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-coder-480b-instruct-bf16", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen3-embedding-0p6b" : {"mode": "embedding", "provider": "fireworks", "base_model": "qwen3-embedding-0.6b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/qwen3-embedding-4b" : {"mode": "embedding", "provider": "fireworks", "base_model": "qwen3-embedding-4b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/qwen3-embedding-8b" : {"mode": "embedding", "provider": "fireworks", "base_model": "qwen3-embedding-8b", "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "input_cost_per_audio_token": 0}, "accounts/fireworks/models/qwen3-next-80b-a3b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-next-80b-a3b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen3-next-80b-a3b-thinking" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-next-80b-a3b-thinking", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen3-reranker-0p6b" : {"mode": "rerank", "provider": "fireworks", "base_model": "qwen3-reranker-0.6b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/qwen3-reranker-4b" : {"mode": "rerank", "provider": "fireworks", "base_model": "qwen3-reranker-4b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/qwen3-reranker-8b" : {"mode": "rerank", "provider": "fireworks", "base_model": "qwen3-reranker-8b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/qwen3-vl-235b-a22b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-vl-235b-a22b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/qwen3-vl-235b-a22b-thinking" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-vl-235b-a22b-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "accounts/fireworks/models/qwen3-vl-30b-a3b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-vl-30b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "accounts/fireworks/models/qwen3-vl-30b-a3b-thinking" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-vl-30b-a3b-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "accounts/fireworks/models/qwen3-vl-32b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-vl-32b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/qwen3-vl-8b-instruct" : {"mode": "chat", "provider": "fireworks", "base_model": "qwen3-vl-8b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/qwq-32b" : {"mode": "chat", "provider": "fireworks", "base_model": "qwq-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/rolm-ocr" : {"mode": "chat", "provider": "fireworks", "base_model": "rolm-ocr", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/snorkel-mistral-7b-pairrm-dpo" : {"mode": "chat", "provider": "fireworks", "base_model": "snorkel-mistral-7b-pairrm-dpo", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/stable-diffusion-xl-1024-v1-0" : {"mode": "image_generation", "provider": "fireworks", "base_model": "stable-diffusion-xl-1024-v1-0", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000000013, "output_cost_per_token": 0.00000000013}, "accounts/fireworks/models/stablecode-3b" : {"mode": "chat", "provider": "fireworks", "base_model": "stablecode-3b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/starcoder-16b" : {"mode": "chat", "provider": "fireworks", "base_model": "starcoder-16b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/starcoder-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "starcoder-7b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/starcoder2-15b" : {"mode": "chat", "provider": "fireworks", "base_model": "starcoder2-15b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/starcoder2-3b" : {"mode": "chat", "provider": "fireworks", "base_model": "starcoder2-3b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "accounts/fireworks/models/starcoder2-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "starcoder2-7b", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/toppy-m-7b" : {"mode": "chat", "provider": "fireworks", "base_model": "toppy-m-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/whisper-v3" : {"mode": "audio_transcription", "provider": "fireworks", "base_model": "whisper-v3", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/whisper-v3-turbo" : {"mode": "audio_transcription", "provider": "fireworks", "base_model": "whisper-v3-turbo", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "accounts/fireworks/models/yi-34b" : {"mode": "chat", "provider": "fireworks", "base_model": "yi-34b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/yi-34b-200k-capybara" : {"mode": "chat", "provider": "fireworks", "base_model": "yi-34b-200k-capybara", "max_input_tokens": 200000, "max_output_tokens": 200000, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/yi-34b-chat" : {"mode": "chat", "provider": "fireworks", "base_model": "yi-34b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "accounts/fireworks/models/yi-6b" : {"mode": "chat", "provider": "fireworks", "base_model": "yi-6b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "accounts/fireworks/models/yi-large" : {"mode": "chat", "provider": "fireworks", "base_model": "yi-large", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003}, "accounts/fireworks/models/zephyr-7b-beta" : {"mode": "chat", "provider": "fireworks", "base_model": "zephyr-7b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "ada" : {"mode": "embedding", "provider": "azure", "base_model": "ada", "max_input_tokens": 8191, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "ai21.j2-mid-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "j2-mid-v1", "max_input_tokens": 8191, "max_output_tokens": 8191, "input_cost_per_token": 0.0000125, "output_cost_per_token": 0.0000125}, "ai21.j2-ultra-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "j2-ultra-v1", "max_input_tokens": 8191, "max_output_tokens": 8191, "input_cost_per_token": 0.0000188, "output_cost_per_token": 0.0000188}, "ai21.jamba-1-5-large-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "jamba-1-5-large", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "ai21.jamba-1-5-mini-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "jamba-1-5-mini", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004}, "ai21.jamba-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "jamba-instruct", "max_input_tokens": 70000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000007}, "ai21/jamba-large-1.7" : {"mode": "chat", "provider": "openrouter", "base_model": "jamba-large-1.7", "max_input_tokens": 256000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "aion-labs/aion-1.0" : {"mode": "chat", "provider": "openrouter", "base_model": "aion-1.0", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000008}, "aion-labs/aion-1.0-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "aion-1.0-mini", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000014}, "aion-labs/aion-2.0" : {"mode": "chat", "provider": "openrouter", "base_model": "aion-2.0", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000016, "cache_read_input_token_cost": 0.0000002}, "aion-labs/aion-rp-llama-3.1-8b" : {"mode": "chat", "provider": "openrouter", "base_model": "aion-rp-llama-3.1-8b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000016}, "aisingapore/Gemma-SEA-LION-v4-27B-IT" : {"mode": "chat", "provider": "publicai", "base_model": "gemma-sea-lion-v4-27b-it", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "aisingapore/Qwen-SEA-LION-v4-32B-IT" : {"mode": "chat", "provider": "publicai", "base_model": "qwen-sea-lion-v4-32b-it", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "alibaba-qwen3-32b" : {"mode": "chat", "provider": "gradient_ai", "base_model": "qwen3-32b", "max_input_tokens": 131072, "max_output_tokens": 40960}, "alibaba/qwen-3-14b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "qwen3-14b", "max_input_tokens": 40960, "max_output_tokens": 16384, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000024}, "alibaba/qwen-3-235b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "qwen3-235b", "max_input_tokens": 40960, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "alibaba/qwen-3-30b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "qwen3-30b", "max_input_tokens": 40960, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "alibaba/qwen-3-32b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "qwen3-32b", "max_input_tokens": 40960, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "alibaba/qwen3-coder" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "qwen3-coder", "max_input_tokens": 262144, "max_output_tokens": 66536, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016}, "allenai/Olmo-3-32B-Think" : {"mode": "chat", "provider": "publicai", "base_model": "olmo-3-32b-think", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "allenai/Olmo-3-7B-Instruct" : {"mode": "chat", "provider": "publicai", "base_model": "olmo-3-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "allenai/Olmo-3-7B-Think" : {"mode": "chat", "provider": "publicai", "base_model": "olmo-3-7b-think", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "allenai/olmOCR-7B-0725-FP8" : {"mode": "chat", "provider": "deepinfra", "base_model": "olmocr-7b-0725-fp8", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.0000015}, "allenai/olmo-3-32b-think" : {"mode": "chat", "provider": "openrouter", "base_model": "olmo-3-32b-think", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000005}, "amazon.nova-2-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-lite", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.000000075}, "amazon.nova-2-multimodal-embeddings-v1:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "nova-2-multimodal-embeddings", "max_input_tokens": 8172, "input_cost_per_image": 0.00006, "input_cost_per_token": 0.000000135, "output_cost_per_token": 0, "input_cost_per_audio_per_second": 0.00014, "input_cost_per_video_per_second": 0.0007}, "amazon.nova-2-pro-preview-20251202-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-pro", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000021875, "output_cost_per_token": 0.0000175, "input_cost_per_audio_token": 0.0000021875, "input_cost_per_image_token": 0.0000021875, "cache_read_input_token_cost": 0.000000546875}, "amazon.nova-canvas-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "nova-canvas", "max_input_tokens": 2600, "output_cost_per_image": 0.06}, "amazon.nova-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-lite", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024}, "amazon.nova-micro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-micro", "max_input_tokens": 128000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014}, "amazon.nova-pro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032}, "amazon.rerank-v1:0" : {"mode": "rerank", "provider": "bedrock", "base_model": "rerank", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "amazon.titan-embed-image-v1" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-image-v1", "max_input_tokens": 128, "input_cost_per_image": 0.00006, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0}, "amazon.titan-embed-text-v1" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-text-v1", "max_input_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "amazon.titan-embed-text-v2:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-text", "max_input_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0}, "amazon.titan-image-generator-v1" : {"mode": "image_generation", "provider": "bedrock", "base_model": "titan-image-generator-v1", "input_cost_per_image": 0, "output_cost_per_image": 0.008, "output_cost_per_image_premium_image": 0.01, "output_cost_per_image_above_512_and_512_pixels": 0.01, "output_cost_per_image_above_512x512_pixels_premium": 0.012}, "amazon.titan-image-generator-v2" : {"mode": "image_generation", "provider": "bedrock", "base_model": "titan-image-generator-v2", "input_cost_per_image": 0, "output_cost_per_image": 0.008, "output_cost_per_image_premium_image": 0.01, "output_cost_per_image_above_1024_and_1024_pixels": 0.01, "output_cost_per_image_above_1024x1024_pixels_premium": 0.012}, "amazon.titan-image-generator-v2:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "titan-image-generator", "input_cost_per_image": 0, "output_cost_per_image": 0.008, "output_cost_per_image_premium_image": 0.01, "output_cost_per_image_above_1024_and_1024_pixels": 0.01, "output_cost_per_image_above_1024x1024_pixels_premium": 0.012}, "amazon.titan-text-express-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-express-v1", "max_input_tokens": 42000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000013, "output_cost_per_token": 0.0000017}, "amazon.titan-text-lite-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-lite-v1", "max_input_tokens": 42000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000004}, "amazon.titan-text-premier-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-premier", "max_input_tokens": 42000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "amazon/nova-2-lite-v1" : {"mode": "chat", "provider": "openrouter", "base_model": "nova-2-lite-v1", "max_input_tokens": 1000000, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025}, "amazon/nova-lite" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "nova-lite", "max_input_tokens": 300000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024}, "amazon/nova-lite-v1" : {"mode": "chat", "provider": "openrouter", "base_model": "nova-lite-v1", "max_input_tokens": 300000, "max_output_tokens": 5120, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024}, "amazon/nova-micro" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "nova-micro", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014}, "amazon/nova-micro-v1" : {"mode": "chat", "provider": "openrouter", "base_model": "nova-micro-v1", "max_input_tokens": 128000, "max_output_tokens": 5120, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014}, "amazon/nova-premier-v1" : {"mode": "chat", "provider": "openrouter", "base_model": "nova-premier-v1", "max_input_tokens": 1000000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.0000125, "cache_read_input_token_cost": 0.000000625}, "amazon/nova-pro" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032}, "amazon/nova-pro-v1" : {"mode": "chat", "provider": "openrouter", "base_model": "nova-pro-v1", "max_input_tokens": 300000, "max_output_tokens": 5120, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032}, "amazon/titan-embed-text-v2" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "titan-embed-text-v2", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "anthracite-org/magnum-v4-72b" : {"mode": "chat", "provider": "openrouter", "base_model": "magnum-v4-72b", "max_input_tokens": 16384, "max_output_tokens": 2048, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000005}, "anthropic-claude-3-opus" : {"mode": "chat", "provider": "gradient_ai", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 1024, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075}, "anthropic-claude-3.5-haiku" : {"mode": "chat", "provider": "gradient_ai", "base_model": "claude-3-5-haiku", "max_input_tokens": 200000, "max_output_tokens": 1024, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004}, "anthropic-claude-3.5-sonnet" : {"mode": "chat", "provider": "gradient_ai", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 1024, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "anthropic-claude-3.7-sonnet" : {"mode": "chat", "provider": "gradient_ai", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 1024, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "anthropic.claude-3-5-haiku-20241022-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-haiku", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000008, "cache_creation_input_token_cost": 0.000001}, "anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 1000000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.00003, "cache_creation_input_token_cost_above_1hr": 0.0000075, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075, "cache_creation_input_token_cost_above_1hr_above_200k_tokens": 0.000015}, "anthropic.claude-3-5-sonnet-20241022-v2:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.00003, "cache_creation_input_token_cost_above_1hr": 0.0000075, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075, "cache_creation_input_token_cost_above_1hr_above_200k_tokens": 0.000015}, "anthropic.claude-3-7-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000036, "output_cost_per_token": 0.000018, "cache_read_input_token_cost": 0.00000036, "cache_creation_input_token_cost": 0.0000045}, "anthropic.claude-3-7-sonnet-20250219-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic.claude-3-haiku-20240307-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.0000003125}, "anthropic.claude-3-opus-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "anthropic.claude-3-sonnet-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125, "cache_creation_input_token_cost_above_1hr": 0.000002}, "anthropic.claude-haiku-4-5@20251001" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125, "cache_creation_input_token_cost_above_1hr": 0.000002}, "anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024}, "anthropic.claude-mythos-preview" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-mythos", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "anthropic.claude-opus-4-1-20250805-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "anthropic.claude-opus-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "anthropic.claude-opus-4-5-20251101-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "anthropic.claude-opus-4-6-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "anthropic.claude-opus-4-7" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "anthropic.claude-opus-4-8" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "anthropic.claude-sonnet-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_creation_input_token_cost_above_1hr": 0.000006, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075, "cache_creation_input_token_cost_above_1hr_above_200k_tokens": 0.000012}, "anthropic.claude-sonnet-4-6" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "anthropic/claude-3-5-sonnet" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic/claude-3-5-sonnet-20241022" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic/claude-3-7-sonnet" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic/claude-3-7-sonnet-latest" : {"mode": "chat", "provider": "deepinfra", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 200000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033}, "anthropic/claude-3-haiku" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_image": 0.0004, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.0000003}, "anthropic/claude-3-opus" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "anthropic/claude-3.5-haiku" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-3.5-haiku", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000008, "cache_creation_input_token_cost": 0.000001}, "anthropic/claude-3.5-sonnet" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic/claude-3.7-sonnet" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_image": 0.0048, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "anthropic/claude-4-opus" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "anthropic/claude-4-sonnet" : {"mode": "chat", "provider": "deepinfra", "base_model": "claude-sonnet-4", "max_input_tokens": 200000, "max_output_tokens": 200000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165}, "anthropic/claude-4.5-haiku" : {"mode": "chat", "provider": "replicate", "base_model": "claude-haiku-4-5", "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005}, "anthropic/claude-4.5-sonnet" : {"mode": "chat", "provider": "replicate", "base_model": "claude-sonnet-4-5", "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "anthropic/claude-haiku-4-5" : {"mode": "responses", "provider": "perplexity", "base_model": "claude-haiku-4-5"}, "anthropic/claude-haiku-4.5" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125}, "anthropic/claude-opus-4" : {"mode": "chat", "provider": "gmi", "base_model": "claude-opus-4", "max_input_tokens": 409600, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075}, "anthropic/claude-opus-4-5" : {"mode": "responses", "provider": "perplexity", "base_model": "claude-opus-4-5"}, "anthropic/claude-opus-4-6" : {"mode": "responses", "provider": "perplexity", "base_model": "claude-opus-4-6"}, "anthropic/claude-opus-4-7" : {"mode": "responses", "provider": "perplexity", "base_model": "claude-opus-4-7"}, "anthropic/claude-opus-4.1" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_image": 0.0048, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875, "cache_creation_input_token_cost_above_1hr": 0.00003}, "anthropic/claude-opus-4.5" : {"mode": "chat", "provider": "gmi", "base_model": "claude-opus-4-5", "max_input_tokens": 409600, "max_output_tokens": 32000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025}, "anthropic/claude-opus-4.6" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-opus-4-6", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "anthropic/claude-opus-4.6-fast" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-4.6-fast", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00015, "cache_read_input_token_cost": 0.000003, "cache_creation_input_token_cost": 0.0000375}, "anthropic/claude-opus-4.7" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "anthropic/claude-opus-4.7-fast" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-4.7-fast", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00015, "cache_read_input_token_cost": 0.000003, "cache_creation_input_token_cost": 0.0000375}, "anthropic/claude-opus-4.8" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-4.8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "anthropic/claude-opus-4.8-fast" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-4.8-fast", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00005, "cache_read_input_token_cost": 0.000001, "cache_creation_input_token_cost": 0.0000125}, "anthropic/claude-sonnet-4" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-sonnet-4", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic/claude-sonnet-4-5" : {"mode": "responses", "provider": "perplexity", "base_model": "claude-sonnet-4-5"}, "anthropic/claude-sonnet-4.5" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "claude-sonnet-4-5", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "anthropic/claude-sonnet-4.6" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.01475, "output_cost_per_second": 0.01475}, "ap-northeast-1/1-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0455, "output_cost_per_second": 0.0455}, "ap-northeast-1/1-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0455, "output_cost_per_second": 0.0455}, "ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.008194, "output_cost_per_second": 0.008194}, "ap-northeast-1/6-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02527, "output_cost_per_second": 0.02527}, "ap-northeast-1/6-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02527, "output_cost_per_second": 0.02527}, "ap-northeast-1/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000223, "output_cost_per_token": 0.00000755}, "ap-northeast-1/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "ap-northeast-1/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "ap-northeast-1/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000074, "output_cost_per_token": 0.00000222}, "ap-northeast-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "ap-northeast-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "ap-northeast-1/moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000073, "output_cost_per_token": 0.00000303}, "ap-northeast-1/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.0000036}, "ap-northeast-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "ap-south-1/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000074, "output_cost_per_token": 0.00000222}, "ap-south-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000318, "output_cost_per_token": 0.0000042}, "ap-south-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000072}, "ap-south-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "ap-south-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "ap-south-1/moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000071, "output_cost_per_token": 0.00000294}, "ap-south-1/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.0000036}, "ap-south-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "ap-southeast-2/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.000000309, "output_cost_per_token": 0.000001236}, "ap-southeast-3/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000074, "output_cost_per_token": 0.00000222}, "ap-southeast-3/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "ap-southeast-3/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "ap-southeast-3/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.0000036}, "ap-southeast-3/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "apac.amazon.nova-2-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-lite", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000033, "output_cost_per_token": 0.00000275, "cache_read_input_token_cost": 0.0000000825}, "apac.amazon.nova-2-pro-preview-20251202-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-pro", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000021875, "output_cost_per_token": 0.0000175, "input_cost_per_audio_token": 0.0000021875, "input_cost_per_image_token": 0.0000021875, "cache_read_input_token_cost": 0.000000546875}, "apac.amazon.nova-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-lite", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000063, "output_cost_per_token": 0.000000252}, "apac.amazon.nova-micro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-micro", "max_input_tokens": 128000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000037, "output_cost_per_token": 0.000000148}, "apac.amazon.nova-pro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000084, "output_cost_per_token": 0.00000336}, "apac.anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "apac.anthropic.claude-3-5-sonnet-20241022-v2:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "apac.anthropic.claude-3-haiku-20240307-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.0000003125}, "apac.anthropic.claude-3-sonnet-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "apac.anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000055, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0.000001375}, "apac.anthropic.claude-sonnet-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "arcee-ai/coder-large" : {"mode": "chat", "provider": "openrouter", "base_model": "coder-large", "max_input_tokens": 32768, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000008}, "arcee-ai/maestro-reasoning" : {"mode": "chat", "provider": "openrouter", "base_model": "maestro-reasoning", "max_input_tokens": 131072, "max_output_tokens": 32000, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000033}, "arcee-ai/spotlight" : {"mode": "chat", "provider": "openrouter", "base_model": "spotlight", "max_input_tokens": 131072, "max_output_tokens": 65537, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018}, "arcee-ai/trinity-large-thinking" : {"mode": "chat", "provider": "openrouter", "base_model": "trinity-large-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000085, "cache_read_input_token_cost": 0.00000006}, "arcee-ai/trinity-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "trinity-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000045, "output_cost_per_token": 0.00000015}, "arcee-ai/virtuoso-large" : {"mode": "chat", "provider": "openrouter", "base_model": "virtuoso-large", "max_input_tokens": 131072, "max_output_tokens": 64000, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.0000012}, "au.anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000055, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0.000001375}, "au.anthropic.claude-opus-4-6-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875}, "au.anthropic.claude-opus-4-7" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875}, "au.anthropic.claude-opus-4-8" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875, "cache_creation_input_token_cost_above_1hr": 0.000011}, "au.anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125, "input_cost_per_token_above_200k_tokens": 0.0000066, "output_cost_per_token_above_200k_tokens": 0.00002475, "cache_read_input_token_cost_above_200k_tokens": 0.00000066, "cache_creation_input_token_cost_above_200k_tokens": 0.00000825}, "au.anthropic.claude-sonnet-4-6" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "baai/bge-base-en-v1.5" : {"mode": "embedding", "provider": "together_ai", "base_model": "bge-base-en", "max_input_tokens": 512, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "baai/bge-large-en-v1.5" : {"mode": "chat", "provider": "openrouter", "base_model": "bge-large-en-v1.5", "max_input_tokens": 512, "input_cost_per_token": 0.00000001}, "baai/bge-m3" : {"mode": "chat", "provider": "openrouter", "base_model": "bge-m3", "max_input_tokens": 8192, "input_cost_per_token": 0.00000001}, "baai/bge-reranker-v2-m3" : {"mode": "rerank", "provider": "novita", "base_model": "bge-reranker-v2-m3", "max_input_tokens": 8000, "max_output_tokens": 8000, "input_cost_per_token": 0.00000001, "output_cost_per_token": 0.00000001}, "babbage-002" : {"mode": "completion", "provider": "text-completion-openai", "base_model": "babbage-002", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000004}, "baichuan/baichuan-m2-32b" : {"mode": "chat", "provider": "novita", "base_model": "baichuan-m2-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000007}, "baidu/ernie-4.5-21B-a3b" : {"mode": "chat", "provider": "novita", "base_model": "ernie-4.5-21b-a3b", "max_input_tokens": 120000, "max_output_tokens": 8000, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "baidu/ernie-4.5-21B-a3b-thinking" : {"mode": "chat", "provider": "novita", "base_model": "ernie-4.5-21b-a3b-thinking", "max_input_tokens": 131072, "max_output_tokens": 65536, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "baidu/ernie-4.5-300b-a47b-paddle" : {"mode": "chat", "provider": "novita", "base_model": "ernie-4.5-300b-a47b-paddle", "max_input_tokens": 123000, "max_output_tokens": 12000, "input_cost_per_token": 0.00000028, "output_cost_per_token": 0.0000011}, "baidu/ernie-4.5-vl-28b-a3b" : {"mode": "chat", "provider": "openrouter", "base_model": "ernie-4.5-vl-28b-a3b", "max_input_tokens": 30000, "max_output_tokens": 8000, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000056}, "baidu/ernie-4.5-vl-28b-a3b-thinking" : {"mode": "chat", "provider": "novita", "base_model": "ernie-4.5-vl-28b-a3b-thinking", "max_input_tokens": 131072, "max_output_tokens": 65536, "input_cost_per_token": 0.00000039, "output_cost_per_token": 0.00000039}, "baidu/ernie-4.5-vl-424b-a47b" : {"mode": "chat", "provider": "openrouter", "base_model": "ernie-4.5-vl-424b-a47b", "max_input_tokens": 123000, "max_output_tokens": 16000, "input_cost_per_token": 0.00000042, "output_cost_per_token": 0.00000125}, "base" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-conversationalai" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-conversationalai", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-finance" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-finance", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-general" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-general", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-meeting" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-meeting", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-phonecall" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-phonecall", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-video" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-video", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "base-voicemail" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "base-voicemail", "input_cost_per_second": 0.00020833, "output_cost_per_second": 0}, "best" : {"mode": "audio_transcription", "provider": "assemblyai", "base_model": "best", "input_cost_per_second": 0.00003333, "output_cost_per_second": 0}, "bigscience/mt0-xxl-13b" : {"mode": "chat", "provider": "watsonx", "base_model": "mt0-xxl-13b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0005, "output_cost_per_token": 0.002}, "black-forest-labs/FLUX.1-schnell" : {"mode": "image_generation", "provider": "nscale", "base_model": "flux.1-schnell", "input_cost_per_pixel": 0.0000000013, "output_cost_per_pixel": 0}, "black-forest-labs/flux-1.1-pro-ultra" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-1.1-pro-ultra", "output_cost_per_image": 0.06}, "black-forest-labs/flux-2-flex" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-2-flex", "input_cost_per_pixel": 0.00000006, "output_cost_per_pixel": 0.00000006}, "black-forest-labs/flux-2-klein-4b" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-2-klein-4b", "input_cost_per_pixel": 0.000000001, "output_cost_per_pixel": 0.000000001}, "black-forest-labs/flux-2-max" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-2-max", "input_cost_per_pixel": 0.00000003, "output_cost_per_pixel": 0.00000003}, "black-forest-labs/flux-2-pro" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-2-pro", "input_cost_per_pixel": 0.000000015, "output_cost_per_pixel": 0.000000015}, "black-forest-labs/flux-dev" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-dev", "output_cost_per_image": 0.025}, "black-forest-labs/flux-kontext-max" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-kontext-max", "output_cost_per_image": 0.08}, "black-forest-labs/flux-kontext-pro" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-kontext-pro", "output_cost_per_image": 0.04}, "black-forest-labs/flux-pro" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-pro", "output_cost_per_image": 0.055}, "black-forest-labs/flux-schnell" : {"mode": "image_generation", "provider": "replicate", "base_model": "flux-schnell", "output_cost_per_image": 0.003}, "bria/text-to-image/3.2" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "bria/text-to-image/3.2", "output_cost_per_image": 0.0398}, "bytedance-seed/seed-1.6" : {"mode": "chat", "provider": "openrouter", "base_model": "seed-1.6", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002}, "bytedance-seed/seed-1.6-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "seed-1.6-flash", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003}, "bytedance-seed/seed-2.0-lite" : {"mode": "chat", "provider": "openrouter", "base_model": "seed-2.0-lite", "max_input_tokens": 262144, "max_output_tokens": 131072, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002}, "bytedance-seed/seed-2.0-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "seed-2.0-mini", "max_input_tokens": 262144, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004}, "bytedance/seedance-1-lite" : {"mode": "video_generation", "provider": "replicate", "base_model": "seedance-1-lite", "output_cost_per_video_per_second": 0.018}, "bytedance/seedance-1-pro" : {"mode": "video_generation", "provider": "replicate", "base_model": "seedance-1-pro", "output_cost_per_video_per_second": 0.03}, "bytedance/seedream-4" : {"mode": "image_generation", "provider": "replicate", "base_model": "seedream-4", "output_cost_per_image": 0.03}, "bytedance/seedream-5-lite" : {"mode": "image_generation", "provider": "replicate", "base_model": "seedream-5-lite", "output_cost_per_image": 0.035}, "bytedance/ui-tars-1.5-7b" : {"mode": "chat", "provider": "openrouter", "base_model": "ui-tars-1.5-7b", "max_input_tokens": 131072, "max_output_tokens": 2048, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002, "cache_read_input_token_cost": 0.0000001}, "ca-central-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000305, "output_cost_per_token": 0.00000403}, "ca-central-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000069}, "canopylabs/orpheus-3b-0.1-ft" : {"mode": "chat", "provider": "openrouter", "base_model": "orpheus-3b-0.1-ft", "max_input_tokens": 4096, "input_cost_per_token": 0.000007}, "chat-bison" : {"mode": "chat", "provider": "palm", "base_model": "chat-bison", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125}, "chat-bison-001" : {"mode": "chat", "provider": "palm", "base_model": "chat-bison-001", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125}, "chatdolphin" : {"mode": "chat", "provider": "nlp_cloud", "base_model": "chatdolphin", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "chatgpt-4o-latest" : {"mode": "chat", "provider": "openai", "base_model": "chatgpt-4o", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015}, "chatgpt-image-latest" : {"mode": "image_generation", "provider": "openai", "base_model": "chatgpt-image", "input_cost_per_token": 0.000005, "input_cost_per_image_token": 0.00001, "cache_read_input_token_cost": 0.00000125, "output_cost_per_image_token": 0.00004, "cache_read_input_image_token_cost": 0.0000025}, "chirp" : {"mode": "audio_speech", "provider": "vertex", "base_model": "chirp", "input_cost_per_character": 0.00003}, "claude-3-5-haiku" : {"mode": "chat", "provider": "heroku", "base_model": "claude-3-5-haiku", "max_input_tokens": 200000, "max_output_tokens": 8192}, "claude-3-5-haiku@20241022" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-5-haiku", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005}, "claude-3-5-sonnet" : {"mode": "chat", "provider": "snowflake", "base_model": "claude-3-5-sonnet", "max_input_tokens": 18000, "max_output_tokens": 8192}, "claude-3-5-sonnet-latest" : {"mode": "chat", "provider": "heroku", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192}, "claude-3-5-sonnet@20240620" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "claude-3-7-sonnet" : {"mode": "chat", "provider": "heroku", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192}, "claude-3-7-sonnet@20250219" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "claude-3-haiku" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125}, "claude-3-haiku-20240307" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.0000003, "cache_creation_input_token_cost_above_1hr": 0.000006}, "claude-3-haiku@20240307" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125}, "claude-3-opus" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075}, "claude-3-opus@20240229" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075}, "claude-3-sonnet" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "claude-3-sonnet@20240229" : {"mode": "chat", "provider": "vertex", "base_model": "claude-3-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "claude-4-opus-20250514" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "claude-4-sonnet" : {"mode": "chat", "provider": "heroku", "base_model": "claude-sonnet-4", "max_input_tokens": 200000, "max_output_tokens": 8192}, "claude-4-sonnet-20250514" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-haiku-4-5" : {"mode": "chat", "provider": "vertex", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125}, "claude-haiku-4-5-20251001" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125, "cache_creation_input_token_cost_above_1hr": 0.000002}, "claude-haiku-4-5@20251001" : {"mode": "chat", "provider": "vertex", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125}, "claude-haiku-4.5" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 32000}, "claude-opus-4" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "claude-opus-4-1" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "input_cost_per_token_batches": 0.0000075, "output_cost_per_token_batches": 0.0000375, "cache_creation_input_token_cost": 0.00001875}, "claude-opus-4-1-20250805" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875, "cache_creation_input_token_cost_above_1hr": 0.00003}, "claude-opus-4-1@20250805" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "input_cost_per_token_batches": 0.0000075, "output_cost_per_token_batches": 0.0000375, "cache_creation_input_token_cost": 0.00001875}, "claude-opus-4-5" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "claude-opus-4-5-20251101" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "claude-opus-4-5@20251101" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "claude-opus-4-6" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "claude-opus-4-6@default" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "claude-opus-4-7" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "claude-opus-4-7-20260416" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "claude-opus-4-7@default" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "claude-opus-4-8" : {"mode": "chat", "provider": "azure", "base_model": "claude-opus-4-8", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "claude-opus-4-8@default" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "claude-opus-4.5" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 32000}, "claude-opus-4.6-fast" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-opus-4-6-fast", "max_input_tokens": 128000, "max_output_tokens": 16000}, "claude-opus-4.7" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-opus-4-7", "max_input_tokens": 200000, "max_output_tokens": 64000}, "claude-opus-41" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-opus-4-1", "max_input_tokens": 80000, "max_output_tokens": 16000}, "claude-opus-4@20250514" : {"mode": "chat", "provider": "vertex", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "claude-sonnet-4" : {"mode": "chat", "provider": "vertex", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-sonnet-4-20250514" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_creation_input_token_cost_above_1hr": 0.000006, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-sonnet-4-5" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-sonnet-4-5-20250929" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-sonnet-4-5@20250929" : {"mode": "chat", "provider": "vertex", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "input_cost_per_token_batches": 0.0000015, "output_cost_per_token_batches": 0.0000075, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "claude-sonnet-4-6" : {"mode": "chat", "provider": "anthropic", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "claude-sonnet-4-6@default" : {"mode": "chat", "provider": "vertex", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "claude-sonnet-4.5" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 32000}, "claude-sonnet-4.6" : {"mode": "chat", "provider": "github_copilot", "base_model": "claude-sonnet-4-6", "max_input_tokens": 200000, "max_output_tokens": 32000}, "claude-sonnet-4@20250514" : {"mode": "chat", "provider": "vertex", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "codegeex4" : {"mode": "chat", "provider": "ollama", "base_model": "codegeex4", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "codegemma" : {"mode": "completion", "provider": "ollama", "base_model": "codegemma", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "codellama" : {"mode": "completion", "provider": "ollama", "base_model": "codellama", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "codellama-34b-instruct" : {"mode": "chat", "provider": "perplexity", "base_model": "codellama-34b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.0000014}, "codellama-70b-instruct" : {"mode": "chat", "provider": "perplexity", "base_model": "codellama-70b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000028}, "codellama-7b" : {"mode": "chat", "provider": "llamagate", "base_model": "codellama-7b", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000012}, "codellama/CodeLlama-34b-Instruct-hf" : {"mode": "chat", "provider": "anyscale", "base_model": "codellama-34b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "codellama/CodeLlama-70b-Instruct-hf" : {"mode": "chat", "provider": "anyscale", "base_model": "codellama-70b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "codestral-2" : {"mode": "chat", "provider": "vertex", "base_model": "codestral-2", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009}, "codestral-2405" : {"mode": "chat", "provider": "mistral", "base_model": "codestral", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "codestral-2501" : {"mode": "chat", "provider": "vertex", "base_model": "codestral", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "codestral-2508" : {"mode": "chat", "provider": "mistral", "base_model": "codestral", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009}, "codestral-2@001" : {"mode": "chat", "provider": "vertex", "base_model": "codestral-2", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009}, "codestral-embed" : {"mode": "embedding", "provider": "mistral", "base_model": "codestral-embed", "max_input_tokens": 8192, "input_cost_per_token": 0.00000015}, "codestral-embed-2505" : {"mode": "embedding", "provider": "mistral", "base_model": "codestral-embed", "max_input_tokens": 8192, "input_cost_per_token": 0.00000015}, "codestral-latest" : {"mode": "chat", "provider": "mistral", "base_model": "codestral", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "codestral-mamba-latest" : {"mode": "chat", "provider": "mistral", "base_model": "codestral-mamba", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025}, "codestral@2405" : {"mode": "chat", "provider": "vertex", "base_model": "codestral", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "codestral@latest" : {"mode": "chat", "provider": "vertex", "base_model": "codestral", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "codex-auto-review" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.4", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000015, "input_cost_per_token_flex": 0.00000125, "output_cost_per_token_flex": 0.0000075, "cache_read_input_token_cost": 0.00000025, "input_cost_per_token_batches": 0.00000125, "input_cost_per_token_priority": 0.000005, "output_cost_per_token_batches": 0.0000075, "output_cost_per_token_priority": 0.00003, "cache_read_input_token_cost_flex": 0.00000013, "cache_read_input_token_cost_priority": 0.0000005, "input_cost_per_token_above_272k_tokens": 0.000005, "output_cost_per_token_above_272k_tokens": 0.0000225, "cache_read_input_token_cost_above_272k_tokens": 0.0000005}, "codex-mini" : {"mode": "responses", "provider": "azure", "base_model": "codex-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.000000375}, "codex-mini-latest" : {"mode": "responses", "provider": "openai", "base_model": "codex-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.000000375}, "cohere-rerank-v3-english" : {"mode": "rerank", "provider": "azure", "base_model": "rerank-v3-english", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "cohere-rerank-v3-multilingual" : {"mode": "rerank", "provider": "azure", "base_model": "rerank-v3-multilingual", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "cohere-rerank-v3.5" : {"mode": "rerank", "provider": "azure", "base_model": "rerank", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "cohere-rerank-v4.0-fast" : {"mode": "rerank", "provider": "azure", "base_model": "rerank-v4.0-fast", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "cohere-rerank-v4.0-pro" : {"mode": "rerank", "provider": "azure", "base_model": "rerank-v4.0-pro", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "cohere.command-a-03-2025" : {"mode": "chat", "provider": "oci", "base_model": "command-a", "max_input_tokens": 256000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000156, "output_cost_per_token": 0.00000156}, "cohere.command-a-reasoning-08-2025" : {"mode": "chat", "provider": "oci", "base_model": "command-a", "max_input_tokens": 256000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000156, "output_cost_per_token": 0.00000156}, "cohere.command-a-translate-08-2025" : {"mode": "chat", "provider": "oci", "base_model": "command-a-translate", "max_input_tokens": 256000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000009}, "cohere.command-a-vision-07-2025" : {"mode": "chat", "provider": "oci", "base_model": "command-a-vision", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000156, "output_cost_per_token": 0.00000156}, "cohere.command-latest" : {"mode": "chat", "provider": "oci", "base_model": "command", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000156, "output_cost_per_token": 0.00000156}, "cohere.command-light-text-v14" : {"mode": "chat", "provider": "bedrock", "base_model": "command-light-text-v14", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006}, "cohere.command-plus-latest" : {"mode": "chat", "provider": "oci", "base_model": "command-plus", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000156, "output_cost_per_token": 0.00000156}, "cohere.command-r-08-2024" : {"mode": "chat", "provider": "oci", "base_model": "command-r", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "cohere.command-r-plus-08-2024" : {"mode": "chat", "provider": "oci", "base_model": "command-r-plus", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000156, "output_cost_per_token": 0.00000156}, "cohere.command-r-plus-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "command-r-plus", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "cohere.command-r-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "command-r", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "cohere.command-text-v14" : {"mode": "chat", "provider": "bedrock", "base_model": "command-text-v14", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002}, "cohere.embed-english-image-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-english-image", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-english-light-image-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-english-light-image", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-english-light-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-english-light", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-english-v3" : {"mode": "embedding", "provider": "bedrock", "base_model": "embed-english-v3", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-english-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-english", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-multilingual-light-image-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-multilingual-light-image", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-multilingual-light-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-multilingual-light", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-multilingual-v3" : {"mode": "embedding", "provider": "bedrock", "base_model": "embed-multilingual-v3", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-multilingual-v3.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed-multilingual", "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "cohere.embed-v4.0" : {"mode": "embedding", "provider": "oci", "base_model": "embed", "max_input_tokens": 128000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "cohere.embed-v4:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "embed", "max_input_tokens": 128000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "cohere.rerank-v3-5:0" : {"mode": "rerank", "provider": "bedrock", "base_model": "rerank-v3-5", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "cohere/command-a" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "command-a", "max_input_tokens": 256000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "cohere/command-r" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "command-r", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "cohere/command-r-08-2024" : {"mode": "chat", "provider": "openrouter", "base_model": "command-r-08-2024", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "cohere/command-r-plus" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "command-r-plus", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "cohere/command-r-plus-08-2024" : {"mode": "chat", "provider": "openrouter", "base_model": "command-r-plus-08-2024", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "cohere/command-r7b-12-2024" : {"mode": "chat", "provider": "openrouter", "base_model": "command-r7b-12-2024", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000000375, "output_cost_per_token": 0.00000015}, "cohere/embed-v4.0" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "embed", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "command" : {"mode": "completion", "provider": "cohere", "base_model": "command", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002}, "command-a-03-2025" : {"mode": "chat", "provider": "cohere", "base_model": "command-a", "max_input_tokens": 256000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "command-light" : {"mode": "chat", "provider": "cohere", "base_model": "command-light", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006}, "command-nightly" : {"mode": "completion", "provider": "cohere", "base_model": "command-nightly", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002}, "command-r" : {"mode": "chat", "provider": "cohere", "base_model": "command-r", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "command-r-08-2024" : {"mode": "chat", "provider": "cohere", "base_model": "command-r", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "command-r-plus" : {"mode": "chat", "provider": "azure", "base_model": "command-r-plus", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "command-r-plus-08-2024" : {"mode": "chat", "provider": "cohere", "base_model": "command-r-plus", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "command-r7b-12-2024" : {"mode": "chat", "provider": "cohere", "base_model": "command-r7b", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000000375}, "computer-use-preview" : {"mode": "chat", "provider": "azure", "base_model": "computer-use", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012}, "conservative" : {"mode": "image_edit", "provider": "stability", "base_model": "conservative", "output_cost_per_image": 0.04}, "container" : {"mode": "chat", "provider": "openai", "base_model": "container", "code_interpreter_cost_per_session": 0.03}, "container-16g" : {"mode": "chat", "provider": "openai", "base_model": "container", "code_interpreter_cost_per_session": 0.48}, "container-1g" : {"mode": "chat", "provider": "openai", "base_model": "container", "code_interpreter_cost_per_session": 0.03}, "container-4g" : {"mode": "chat", "provider": "openai", "base_model": "container", "code_interpreter_cost_per_session": 0.12}, "container-64g" : {"mode": "chat", "provider": "openai", "base_model": "container", "code_interpreter_cost_per_session": 1.92}, "core42/jais-13b-chat" : {"mode": "chat", "provider": "watsonx", "base_model": "jais-13b-chat", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0005, "output_cost_per_token": 0.002}, "creative" : {"mode": "image_edit", "provider": "stability", "base_model": "creative", "output_cost_per_image": 0.06}, "dall-e-2" : {"mode": "image_generation", "provider": "openai", "base_model": "dall-e-2", "input_cost_per_image": 0.02, "input_cost_per_pixel": 0.000000019, "output_cost_per_pixel": 0}, "dall-e-3" : {"mode": "image_generation", "provider": "aiml", "base_model": "dall-e-3", "output_cost_per_image": 0.052}, "databricks-bge-large-en" : {"mode": "embedding", "provider": "databricks", "base_model": "bge-large-en", "max_input_tokens": 512, "input_cost_per_token": 0.00000010003, "output_cost_per_token": 0}, "databricks-claude-3-7-sonnet" : {"mode": "chat", "provider": "databricks", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000029999900000000002, "output_cost_per_token": 0.000015000020000000002}, "databricks-claude-haiku-4-5" : {"mode": "chat", "provider": "databricks", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000100002, "output_cost_per_token": 0.00000500003}, "databricks-claude-opus-4" : {"mode": "chat", "provider": "databricks", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015000020000000002, "output_cost_per_token": 0.00007500003000000001}, "databricks-claude-opus-4-1" : {"mode": "chat", "provider": "databricks", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015000020000000002, "output_cost_per_token": 0.00007500003000000001}, "databricks-claude-opus-4-5" : {"mode": "chat", "provider": "databricks", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000500003, "output_cost_per_token": 0.000025000010000000002}, "databricks-claude-opus-4-6" : {"mode": "chat", "provider": "databricks", "base_model": "claude-opus-4-6", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000500003, "output_cost_per_token": 0.000025000010000000002}, "databricks-claude-opus-4-7" : {"mode": "chat", "provider": "databricks", "base_model": "claude-opus-4-7", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000500003, "output_cost_per_token": 0.000025000010000000002}, "databricks-claude-opus-4-8" : {"mode": "chat", "provider": "databricks", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000500003, "output_cost_per_token": 0.000025000010000000002}, "databricks-claude-sonnet-4" : {"mode": "chat", "provider": "databricks", "base_model": "claude-sonnet-4", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000029999900000000002, "output_cost_per_token": 0.000015000020000000002}, "databricks-claude-sonnet-4-1" : {"mode": "chat", "provider": "databricks", "base_model": "claude-sonnet-4-1", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000029999900000000002, "output_cost_per_token": 0.000015000020000000002}, "databricks-claude-sonnet-4-5" : {"mode": "chat", "provider": "databricks", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000029999900000000002, "output_cost_per_token": 0.000015000020000000002}, "databricks-claude-sonnet-4-6" : {"mode": "chat", "provider": "databricks", "base_model": "claude-sonnet-4-6", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000029999900000000002, "output_cost_per_token": 0.000015000020000000002}, "databricks-gemini-2-5-flash" : {"mode": "chat", "provider": "databricks", "base_model": "gemini-2.5-flash", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.00000030001999999999996, "output_cost_per_token": 0.00000249998}, "databricks-gemini-2-5-pro" : {"mode": "chat", "provider": "databricks", "base_model": "gemini-2.5-pro", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000124999, "output_cost_per_token": 0.000009999990000000002}, "databricks-gemma-3-12b" : {"mode": "chat", "provider": "databricks", "base_model": "gemma-3-12b", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000015000999999999998, "output_cost_per_token": 0.00000050001}, "databricks-gpt-5" : {"mode": "chat", "provider": "databricks", "base_model": "gpt-5", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000124999, "output_cost_per_token": 0.000009999990000000002}, "databricks-gpt-5-1" : {"mode": "chat", "provider": "databricks", "base_model": "gpt-5-1", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000124999, "output_cost_per_token": 0.000009999990000000002}, "databricks-gpt-5-mini" : {"mode": "chat", "provider": "databricks", "base_model": "gpt-5-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000024997000000000006, "output_cost_per_token": 0.0000019999700000000004}, "databricks-gpt-5-nano" : {"mode": "chat", "provider": "databricks", "base_model": "gpt-5-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000004998, "output_cost_per_token": 0.00000039998000000000007}, "databricks-gpt-oss-120b" : {"mode": "chat", "provider": "databricks", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000015000999999999998, "output_cost_per_token": 0.00000059997}, "databricks-gpt-oss-20b" : {"mode": "chat", "provider": "databricks", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000030001999999999996}, "databricks-gte-large-en" : {"mode": "embedding", "provider": "databricks", "base_model": "gte-large-en", "max_input_tokens": 8192, "input_cost_per_token": 0.00000012999000000000001, "output_cost_per_token": 0}, "databricks-llama-2-70b-chat" : {"mode": "chat", "provider": "databricks", "base_model": "llama-2-70b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000050001, "output_cost_per_token": 0.0000015000300000000002}, "databricks-llama-4-maverick" : {"mode": "chat", "provider": "databricks", "base_model": "llama-4-maverick", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000050001, "output_cost_per_token": 0.0000015000300000000002}, "databricks-meta-llama-3-1-405b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "llama-3-1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000500003, "output_cost_per_token": 0.000015000020000000002}, "databricks-meta-llama-3-1-8b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "llama-3-1-8b-instruct", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015000999999999998, "output_cost_per_token": 0.00000045003000000000007}, "databricks-meta-llama-3-3-70b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "llama-3-3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000050001, "output_cost_per_token": 0.0000015000300000000002}, "databricks-meta-llama-3-70b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "llama-3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000100002, "output_cost_per_token": 0.0000029999900000000002}, "databricks-mixtral-8x7b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000050001, "output_cost_per_token": 0.00000100002}, "databricks-mpt-30b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "mpt-30b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000100002, "output_cost_per_token": 0.00000100002}, "databricks-mpt-7b-instruct" : {"mode": "chat", "provider": "databricks", "base_model": "mpt-7b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000050001, "output_cost_per_token": 0}, "davinci-002" : {"mode": "completion", "provider": "text-completion-openai", "base_model": "davinci-002", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "deep-research-pro-preview-12-2025" : {"mode": "image_generation", "provider": "vertex", "base_model": "deep-research-pro", "max_input_tokens": 65536, "max_output_tokens": 32768, "input_cost_per_image": 0.0011, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.134, "output_cost_per_token": 0.000012, "output_cost_per_image_token": 0.00012, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000006}, "deepcogito/cogito-v2.1-671b" : {"mode": "chat", "provider": "openrouter", "base_model": "cogito-v2.1-671b", "max_input_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00000125}, "deepseek-ai/DeepSeek-R1" : {"mode": "chat", "provider": "deepinfra", "base_model": "deepseek-r1", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000024}, "deepseek-ai/DeepSeek-R1-0528" : {"mode": "chat", "provider": "crusoe", "base_model": "deepseek-r1", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000007}, "deepseek-ai/DeepSeek-R1-0528-Turbo" : {"mode": "chat", "provider": "deepinfra", "base_model": "deepseek-r1-0528-turbo", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "deepseek-ai/DeepSeek-R1-0528-tput" : {"mode": "chat", "provider": "together_ai", "base_model": "deepseek-r1", "max_input_tokens": 128000, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.00000219}, "deepseek-ai/DeepSeek-R1-Distill-Llama-70B" : {"mode": "chat", "provider": "nebius", "base_model": "deepseek-r1-distill-llama-70b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000075}, "deepseek-ai/DeepSeek-R1-Distill-Llama-8B" : {"mode": "chat", "provider": "nscale", "base_model": "deepseek-r1-distill-llama-8b", "input_cost_per_token": 0.000000025, "output_cost_per_token": 0.000000025}, "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B" : {"mode": "chat", "provider": "nscale", "base_model": "deepseek-r1-distill-qwen-1.5b", "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000009}, "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B" : {"mode": "chat", "provider": "nscale", "base_model": "deepseek-r1-distill-qwen-14b", "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000007}, "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B" : {"mode": "chat", "provider": "deepinfra", "base_model": "deepseek-r1-distill-qwen-32b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000027}, "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B" : {"mode": "chat", "provider": "nscale", "base_model": "deepseek-r1-distill-qwen-7b", "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "deepseek-ai/DeepSeek-R1-Turbo" : {"mode": "chat", "provider": "deepinfra", "base_model": "deepseek-r1-turbo", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "deepseek-ai/DeepSeek-V3" : {"mode": "chat", "provider": "together_ai", "base_model": "deepseek-v3", "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00000125}, "deepseek-ai/DeepSeek-V3-0324" : {"mode": "chat", "provider": "baseten", "base_model": "deepseek-v3", "input_cost_per_token": 0.00000077, "output_cost_per_token": 0.00000077}, "deepseek-ai/DeepSeek-V3.1" : {"mode": "chat", "provider": "baseten", "base_model": "deepseek-v3.1", "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "deepseek-ai/DeepSeek-V3.1-Terminus" : {"mode": "chat", "provider": "deepinfra", "base_model": "deepseek-v3.1-terminus", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.000001, "cache_read_input_token_cost": 0.000000216}, "deepseek-ai/DeepSeek-V3.2" : {"mode": "chat", "provider": "gmi", "base_model": "deepseek-v3.2", "max_input_tokens": 163840, "max_output_tokens": 16384, "input_cost_per_token": 0.00000028, "output_cost_per_token": 0.0000004}, "deepseek-ai/deepseek-ocr-maas" : {"mode": "ocr", "provider": "vertex", "base_model": "deepseek-ocr", "ocr_cost_per_page": 0.0003, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "deepseek-ai/deepseek-r1" : {"mode": "chat", "provider": "replicate", "base_model": "deepseek-r1", "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.00000375, "output_cost_per_token": 0.00001}, "deepseek-ai/deepseek-r1-0528-maas" : {"mode": "chat", "provider": "vertex", "base_model": "deepseek-r1", "max_input_tokens": 65336, "max_output_tokens": 8192, "input_cost_per_token": 0.00000135, "output_cost_per_token": 0.0000054}, "deepseek-ai/deepseek-v3" : {"mode": "chat", "provider": "replicate", "base_model": "deepseek-v3", "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.00000145, "output_cost_per_token": 0.00000145}, "deepseek-ai/deepseek-v3.1" : {"mode": "chat", "provider": "replicate", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.000000672, "output_cost_per_token": 0.000002016}, "deepseek-ai/deepseek-v3.1-maas" : {"mode": "chat", "provider": "vertex", "base_model": "deepseek-v3.1", "max_input_tokens": 163840, "max_output_tokens": 32768, "input_cost_per_token": 0.00000135, "output_cost_per_token": 0.0000054}, "deepseek-ai/deepseek-v3.2-maas" : {"mode": "chat", "provider": "vertex", "base_model": "deepseek-v3.2", "max_input_tokens": 163840, "max_output_tokens": 32768, "input_cost_per_token": 0.00000056, "output_cost_per_token": 0.00000168, "input_cost_per_token_batches": 0.00000028, "output_cost_per_token_batches": 0.00000084}, "deepseek-chat" : {"mode": "chat", "provider": "deepseek", "base_model": "deepseek-chat", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.00000028, "output_cost_per_token": 0.00000042, "cache_read_input_token_cost": 0.000000028, "cache_creation_input_token_cost": 0}, "deepseek-coder" : {"mode": "chat", "provider": "deepseek", "base_model": "deepseek-coder", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000028}, "deepseek-coder-6.7b" : {"mode": "chat", "provider": "llamagate", "base_model": "deepseek-coder-6.7b", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000012}, "deepseek-coder-v2-base" : {"mode": "completion", "provider": "ollama", "base_model": "deepseek-coder-v2-base", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "deepseek-coder-v2-instruct" : {"mode": "chat", "provider": "ollama", "base_model": "deepseek-coder-v2-instruct", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "deepseek-coder-v2-lite-base" : {"mode": "completion", "provider": "ollama", "base_model": "deepseek-coder-v2-lite-base", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "deepseek-coder-v2-lite-instruct" : {"mode": "chat", "provider": "ollama", "base_model": "deepseek-coder-v2-lite-instruct", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "deepseek-llama3.3-70b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "deepseek-llama3.3-70b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "deepseek-r1" : {"mode": "chat", "provider": "azure", "base_model": "deepseek-r1", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000135, "output_cost_per_token": 0.0000054}, "deepseek-r1-0528" : {"mode": "chat", "provider": "lambda_ai", "base_model": "deepseek-r1", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "deepseek-r1-671b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "deepseek-r1-671b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000008}, "deepseek-r1-7b-qwen" : {"mode": "chat", "provider": "llamagate", "base_model": "deepseek-r1-7b-qwen", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000015}, "deepseek-r1-8b" : {"mode": "chat", "provider": "llamagate", "base_model": "deepseek-r1-8b", "max_input_tokens": 65536, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002}, "deepseek-r1-distill-llama-70b" : {"mode": "chat", "provider": "gradient_ai", "base_model": "deepseek-r1-distill-llama-70b", "max_input_tokens": 32768, "max_output_tokens": 8000, "input_cost_per_token": 0.00000099, "output_cost_per_token": 0.00000099}, "deepseek-reasoner" : {"mode": "chat", "provider": "deepseek", "base_model": "deepseek-r1", "max_input_tokens": 131072, "max_output_tokens": 65536, "input_cost_per_token": 0.00000028, "output_cost_per_token": 0.00000042, "cache_read_input_token_cost": 0.000000028}, "deepseek-v3" : {"mode": "chat", "provider": "azure", "base_model": "deepseek-v3", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000114, "output_cost_per_token": 0.00000456}, "deepseek-v3-0324" : {"mode": "chat", "provider": "lambda_ai", "base_model": "deepseek-v3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "deepseek-v3-2-251201" : {"mode": "chat", "provider": "volcengine", "base_model": "deepseek-v3-2", "max_input_tokens": 98304, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "deepseek-v3.1:671b-cloud" : {"mode": "chat", "provider": "ollama", "base_model": "deepseek-v3.1-671b", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0, "output_cost_per_token": 0}, "deepseek-v3.2" : {"mode": "chat", "provider": "deepseek", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000028, "output_cost_per_token": 0.0000004}, "deepseek-v3.2-speciale" : {"mode": "chat", "provider": "azure", "base_model": "deepseek-v3.2", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000058, "output_cost_per_token": 0.00000168}, "deepseek.v3-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek-v3", "max_input_tokens": 163840, "max_output_tokens": 81920, "input_cost_per_token": 0.00000058, "output_cost_per_token": 0.00000168}, "deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000062, "output_cost_per_token": 0.00000185}, "deepseek/deepseek-chat" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-chat", "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000028}, "deepseek/deepseek-chat-v3-0324" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-chat-v3", "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000028, "cache_read_input_token_cost": 0.000000135}, "deepseek/deepseek-chat-v3.1" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-chat", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000008, "cache_read_input_token_cost": 0.00000013}, "deepseek/deepseek-ocr" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-ocr", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000003}, "deepseek/deepseek-prover-v2-671b" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-prover-v2-671b", "max_input_tokens": 160000, "max_output_tokens": 160000, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000025}, "deepseek/deepseek-r1" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-r1", "max_input_tokens": 65336, "max_output_tokens": 8192, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.00000219}, "deepseek/deepseek-r1-0528" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-r1", "max_input_tokens": 163840, "max_output_tokens": 32768, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000035}, "deepseek/deepseek-r1-0528-qwen3-8b" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-r1-0528-qwen3-8b", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000009}, "deepseek/deepseek-r1-distill-llama-70b" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-r1-distill-llama-70b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000008}, "deepseek/deepseek-r1-distill-qwen-14b" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-r1-distill-qwen-14b", "max_input_tokens": 32768, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "deepseek/deepseek-r1-distill-qwen-32b" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-r1-distill-qwen-32b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000029, "output_cost_per_token": 0.00000029}, "deepseek/deepseek-r1-turbo" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-r1-turbo", "max_input_tokens": 64000, "max_output_tokens": 16000, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000025}, "deepseek/deepseek-v3" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "deepseek-v3", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "deepseek/deepseek-v3-0324" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-v3", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000112, "cache_read_input_token_cost": 0.000000135}, "deepseek/deepseek-v3-turbo" : {"mode": "chat", "provider": "novita", "base_model": "deepseek-v3-turbo", "max_input_tokens": 64000, "max_output_tokens": 16000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000013}, "deepseek/deepseek-v3.1" : {"mode": "chat", "provider": "novita", "base_model": "deepseek", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.000001, "cache_read_input_token_cost": 0.000000135}, "deepseek/deepseek-v3.1-terminus" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-v3.1-terminus", "max_input_tokens": 163840, "max_output_tokens": 32768, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000095, "cache_read_input_token_cost": 0.00000013}, "deepseek/deepseek-v3.2" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000028, "output_cost_per_token": 0.0000004}, "deepseek/deepseek-v3.2-exp" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-v3.2", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004}, "deepseek/deepseek-v4-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-v4-flash", "max_input_tokens": 1048576, "max_output_tokens": 131072, "input_cost_per_token": 0.0000000983, "output_cost_per_token": 0.0000001966, "cache_read_input_token_cost": 0.0000000197}, "deepseek/deepseek-v4-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-v4-pro", "max_input_tokens": 1048576, "max_output_tokens": 384000, "input_cost_per_token": 0.000000435, "output_cost_per_token": 0.00000087, "cache_read_input_token_cost": 0.000000003625}, "devstral-2512" : {"mode": "chat", "provider": "mistral", "base_model": "devstral", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "devstral-latest" : {"mode": "chat", "provider": "mistral", "base_model": "devstral", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "devstral-medium-2507" : {"mode": "chat", "provider": "mistral", "base_model": "devstral-medium", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "devstral-medium-latest" : {"mode": "chat", "provider": "mistral", "base_model": "devstral-medium", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "devstral-small-2505" : {"mode": "chat", "provider": "mistral", "base_model": "devstral-small", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "devstral-small-2507" : {"mode": "chat", "provider": "mistral", "base_model": "devstral-small", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "devstral-small-latest" : {"mode": "chat", "provider": "mistral", "base_model": "devstral-small", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "doc-intelligence/prebuilt-document" : {"mode": "ocr", "provider": "azure", "base_model": "doc-intelligence/prebuilt-document", "ocr_cost_per_page": 0.01}, "doc-intelligence/prebuilt-layout" : {"mode": "ocr", "provider": "azure", "base_model": "doc-intelligence/prebuilt-layout", "ocr_cost_per_page": 0.01}, "doc-intelligence/prebuilt-read" : {"mode": "ocr", "provider": "azure", "base_model": "doc-intelligence/prebuilt-read", "ocr_cost_per_page": 0.0015}, "dolphin" : {"mode": "completion", "provider": "nlp_cloud", "base_model": "dolphin", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "dolphin3-8b" : {"mode": "chat", "provider": "llamagate", "base_model": "dolphin3-8b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000015}, "doubao-embedding" : {"mode": "embedding", "provider": "volcengine", "base_model": "doubao-embedding", "max_input_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "doubao-embedding-large" : {"mode": "embedding", "provider": "volcengine", "base_model": "doubao-embedding-large", "max_input_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "doubao-embedding-large-text-240915" : {"mode": "embedding", "provider": "volcengine", "base_model": "doubao-embedding-large-text", "max_input_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "doubao-embedding-large-text-250515" : {"mode": "embedding", "provider": "volcengine", "base_model": "doubao-embedding-large-text", "max_input_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "doubao-embedding-text-240715" : {"mode": "embedding", "provider": "volcengine", "base_model": "doubao-embedding-text", "max_input_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "doubao-seed-2-0-code-preview-260215" : {"mode": "chat", "provider": "volcengine", "base_model": "doubao-seed-2-0-code", "max_input_tokens": 256000, "max_output_tokens": 128000}, "doubao-seed-2-0-lite-260215" : {"mode": "chat", "provider": "volcengine", "base_model": "doubao-seed-2-0-lite", "max_input_tokens": 256000, "max_output_tokens": 128000}, "doubao-seed-2-0-mini-260215" : {"mode": "chat", "provider": "volcengine", "base_model": "doubao-seed-2-0-mini", "max_input_tokens": 256000, "max_output_tokens": 128000}, "doubao-seed-2-0-pro-260215" : {"mode": "chat", "provider": "volcengine", "base_model": "doubao-seed-2-0-pro", "max_input_tokens": 256000, "max_output_tokens": 128000}, "eleven_multilingual_v2" : {"mode": "audio_speech", "provider": "elevenlabs", "base_model": "eleven-multilingual-v2", "input_cost_per_character": 0.00018}, "eleven_v3" : {"mode": "audio_speech", "provider": "elevenlabs", "base_model": "eleven-v3", "input_cost_per_character": 0.00018}, "embed-english-light-v2.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-english-light", "max_input_tokens": 1024, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "embed-english-light-v3.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-english-light", "max_input_tokens": 1024, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "embed-english-v2.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-english", "max_input_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "embed-english-v3.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-english", "max_input_tokens": 1024, "input_cost_per_image": 0.0001, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "embed-multilingual-light-v3.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-multilingual-light", "max_input_tokens": 1024, "input_cost_per_token": 0.0001, "output_cost_per_token": 0}, "embed-multilingual-v2.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-multilingual", "max_input_tokens": 768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "embed-multilingual-v3.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed-multilingual", "max_input_tokens": 1024, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "embed-v-4-0" : {"mode": "embedding", "provider": "azure", "base_model": "embed-v-4-0", "max_input_tokens": 128000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "embed-v4.0" : {"mode": "embedding", "provider": "cohere", "base_model": "embed", "max_input_tokens": 128000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "enhanced" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "enhanced", "input_cost_per_second": 0.00024167, "output_cost_per_second": 0}, "enhanced-finance" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "enhanced-finance", "input_cost_per_second": 0.00024167, "output_cost_per_second": 0}, "enhanced-general" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "enhanced-general", "input_cost_per_second": 0.00024167, "output_cost_per_second": 0}, "enhanced-meeting" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "enhanced-meeting", "input_cost_per_second": 0.00024167, "output_cost_per_second": 0}, "enhanced-phonecall" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "enhanced-phonecall", "input_cost_per_second": 0.00024167, "output_cost_per_second": 0}, "erase" : {"mode": "image_edit", "provider": "stability", "base_model": "erase", "output_cost_per_image": 0.005}, "essentialai/rnj-1-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "rnj-1-instruct", "max_input_tokens": 32768, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "eu-central-1/1-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.01635, "output_cost_per_second": 0.01635}, "eu-central-1/1-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0415, "output_cost_per_second": 0.0415}, "eu-central-1/1-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0415, "output_cost_per_second": 0.0415}, "eu-central-1/6-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.009083, "output_cost_per_second": 0.009083}, "eu-central-1/6-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02305, "output_cost_per_second": 0.02305}, "eu-central-1/6-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02305, "output_cost_per_second": 0.02305}, "eu-central-1/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000248, "output_cost_per_token": 0.00000838}, "eu-central-1/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "eu-central-1/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "eu-central-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-central-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-central-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "eu-north-1/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000074, "output_cost_per_token": 0.00000222}, "eu-north-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-north-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-north-1/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.0000036}, "eu-south-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-south-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-south-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "eu-west-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000286, "output_cost_per_token": 0.00000378}, "eu-west-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000032, "output_cost_per_token": 0.00000065}, "eu-west-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-west-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "eu-west-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "eu-west-2/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000345, "output_cost_per_token": 0.00000455}, "eu-west-2/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000039, "output_cost_per_token": 0.00000078}, "eu-west-2/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000047, "output_cost_per_token": 0.00000186}, "eu-west-2/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000047, "output_cost_per_token": 0.00000186}, "eu-west-2/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.00000078, "output_cost_per_token": 0.00000186}, "eu-west-3/mistral.mistral-7b-instruct-v0:2" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000026}, "eu-west-3/mistral.mistral-large-2402-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-large", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000104, "output_cost_per_token": 0.0000312}, "eu-west-3/mistral.mixtral-8x7b-instruct-v0:1" : {"mode": "chat", "provider": "bedrock", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000091}, "eu.amazon.nova-2-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-lite", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000033, "output_cost_per_token": 0.00000275, "cache_read_input_token_cost": 0.0000000825}, "eu.amazon.nova-2-pro-preview-20251202-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-pro", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000021875, "output_cost_per_token": 0.0000175, "input_cost_per_audio_token": 0.0000021875, "input_cost_per_image_token": 0.0000021875, "cache_read_input_token_cost": 0.000000546875}, "eu.amazon.nova-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-lite", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000078, "output_cost_per_token": 0.000000312}, "eu.amazon.nova-micro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-micro", "max_input_tokens": 128000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000046, "output_cost_per_token": 0.000000184}, "eu.amazon.nova-pro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000105, "output_cost_per_token": 0.0000042}, "eu.anthropic.claude-3-5-haiku-20241022-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-haiku", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.0000003125}, "eu.anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "eu.anthropic.claude-3-5-sonnet-20241022-v2:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "eu.anthropic.claude-3-7-sonnet-20250219-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "eu.anthropic.claude-3-haiku-20240307-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.0000003125}, "eu.anthropic.claude-3-opus-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "eu.anthropic.claude-3-sonnet-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "eu.anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000055, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0.000001375}, "eu.anthropic.claude-opus-4-1-20250805-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "eu.anthropic.claude-opus-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "eu.anthropic.claude-opus-4-5-20251101-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "eu.anthropic.claude-opus-4-6-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875}, "eu.anthropic.claude-opus-4-7" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875}, "eu.anthropic.claude-opus-4-8" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875, "cache_creation_input_token_cost_above_1hr": 0.000011}, "eu.anthropic.claude-sonnet-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "eu.anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125, "input_cost_per_token_above_200k_tokens": 0.0000066, "output_cost_per_token_above_200k_tokens": 0.00002475, "cache_read_input_token_cost_above_200k_tokens": 0.00000066, "cache_creation_input_token_cost_above_200k_tokens": 0.00000825}, "eu.anthropic.claude-sonnet-4-6" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "eu.deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000074, "output_cost_per_token": 0.00000222}, "eu.meta.llama3-2-1b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-1b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013}, "eu.meta.llama3-2-3b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-3b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000019, "output_cost_per_token": 0.00000019}, "eu.mistral.pixtral-large-2502-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "pixtral-large", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "eu.twelvelabs.marengo-embed-2-7-v1:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "marengo-embed-2-7", "max_input_tokens": 77, "input_cost_per_image": 0.0001, "input_cost_per_token": 0.00007, "output_cost_per_token": 0, "input_cost_per_audio_per_second": 0.00014, "input_cost_per_video_per_second": 0.0007}, "eu.twelvelabs.pegasus-1-2-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "pegasus-1-2", "output_cost_per_token": 0.0000075, "input_cost_per_video_per_second": 0.00049}, "eu/gpt-4o-2024-08-06" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.000001375}, "eu/gpt-4o-2024-11-20" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "cache_creation_input_token_cost": 0.00000138}, "eu/gpt-4o-mini-2024-07-18" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.000000165, "output_cost_per_token": 0.00000066, "cache_read_input_token_cost": 0.000000083}, "eu/gpt-4o-mini-realtime-preview-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-mini-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000066, "output_cost_per_token": 0.00000264, "input_cost_per_audio_token": 0.000011, "cache_read_input_token_cost": 0.00000033, "output_cost_per_audio_token": 0.000022, "cache_creation_input_audio_token_cost": 0.00000033}, "eu/gpt-4o-realtime-preview-2024-10-01" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.000022, "input_cost_per_audio_token": 0.00011, "cache_read_input_token_cost": 0.00000275, "output_cost_per_audio_token": 0.00022, "cache_creation_input_audio_token_cost": 0.000022}, "eu/gpt-4o-realtime-preview-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.000022, "input_cost_per_audio_token": 0.000044, "cache_read_input_token_cost": 0.00000275, "output_cost_per_audio_token": 0.00008}, "eu/gpt-5-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001375, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.0000001375}, "eu/gpt-5-mini-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000275, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.0000000275}, "eu/gpt-5-nano-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000055, "output_cost_per_token": 0.00000044, "cache_read_input_token_cost": 0.0000000055}, "eu/gpt-5.1" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000138, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000014}, "eu/gpt-5.1-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000138, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000014}, "eu/gpt-5.1-codex" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000138, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000014}, "eu/gpt-5.1-codex-mini" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000275, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.000000028}, "eu/o1-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000165, "output_cost_per_token": 0.000066, "cache_read_input_token_cost": 0.00000825}, "eu/o1-mini-2024-09-12" : {"mode": "chat", "provider": "azure", "base_model": "o1-mini", "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.00000121, "output_cost_per_token": 0.00000484, "cache_read_input_token_cost": 0.000000605, "input_cost_per_token_batches": 0.000000605, "output_cost_per_token_batches": 0.00000242}, "eu/o1-preview-2024-09-12" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.0000165, "output_cost_per_token": 0.000066, "cache_read_input_token_cost": 0.00000825}, "eu/o3-mini-2025-01-31" : {"mode": "chat", "provider": "azure", "base_model": "o3-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00000121, "output_cost_per_token": 0.00000484, "cache_read_input_token_cost": 0.000000605, "input_cost_per_token_batches": 0.000000605, "output_cost_per_token_batches": 0.00000242}, "fal-ai/bytedance/dreamina/v3.1/text-to-image" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "dreamina/v3.1/text-to-image", "output_cost_per_image": 0.03}, "fal-ai/bytedance/seedream/v3/text-to-image" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "seedream/v3/text-to-image", "output_cost_per_image": 0.03}, "fal-ai/flux-pro/v1.1" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "flux-pro/v1.1", "output_cost_per_image": 0.04}, "fal-ai/flux-pro/v1.1-ultra" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "flux-pro/v1.1-ultra", "output_cost_per_image": 0.06}, "fal-ai/flux/schnell" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "flux/schnell", "output_cost_per_image": 0.003}, "fal-ai/ideogram/v3" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "ideogram/v3", "output_cost_per_image": 0.06}, "fal-ai/imagen4/preview" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "imagen4/preview", "output_cost_per_image": 0.0398}, "fal-ai/imagen4/preview/fast" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "imagen4/preview/fast", "output_cost_per_image": 0.02}, "fal-ai/imagen4/preview/ultra" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "imagen4/preview/ultra", "output_cost_per_image": 0.06}, "fal-ai/recraft/v3/text-to-image" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "v3/text-to-image", "output_cost_per_image": 0.0398}, "fal-ai/stable-diffusion-v35-medium" : {"mode": "image_generation", "provider": "fal_ai", "base_model": "stable-diffusion-v35-medium", "output_cost_per_image": 0.0398}, "fast" : {"mode": "image_edit", "provider": "stability", "base_model": "fast", "output_cost_per_image": 0.002}, "featherless-ai/Qwerky-72B" : {"mode": "chat", "provider": "featherless_ai", "base_model": "qwerky-72b", "max_input_tokens": 32768, "max_output_tokens": 4096}, "featherless-ai/Qwerky-QwQ-32B" : {"mode": "chat", "provider": "featherless_ai", "base_model": "qwerky-qwq-32b", "max_input_tokens": 32768, "max_output_tokens": 4096}, "fireworks-ai-4.1b-to-16b" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-4.1b-to-16b", "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "fireworks-ai-56b-to-176b" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-56b-to-176b", "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "fireworks-ai-above-16b" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-above-16b", "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "fireworks-ai-default" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-default", "input_cost_per_token": 0, "output_cost_per_token": 0}, "fireworks-ai-embedding-150m-to-350m" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-embedding-150m-to-350m", "input_cost_per_token": 0.000000016, "output_cost_per_token": 0}, "fireworks-ai-embedding-up-to-150m" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-embedding-up-to-150m", "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "fireworks-ai-moe-up-to-56b" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-moe-up-to-56b", "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005}, "fireworks-ai-up-to-4b" : {"mode": "", "provider": "fireworks", "base_model": "fireworks-ai-up-to-4b", "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "flux-dev" : {"mode": "image_generation", "provider": "black_forest_labs", "base_model": "flux-dev", "output_cost_per_image": 0.025}, "flux-kontext-max" : {"mode": "image_edit", "provider": "black_forest_labs", "base_model": "flux-kontext-max", "output_cost_per_image": 0.08}, "flux-kontext-pro" : {"mode": "image_edit", "provider": "black_forest_labs", "base_model": "flux-kontext-pro", "output_cost_per_image": 0.04}, "flux-pro" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux-pro", "output_cost_per_image": 0.065}, "flux-pro-1.0-expand" : {"mode": "image_edit", "provider": "black_forest_labs", "base_model": "flux-pro-1.0-expand", "output_cost_per_image": 0.05}, "flux-pro-1.0-fill" : {"mode": "image_edit", "provider": "black_forest_labs", "base_model": "flux-pro-1.0-fill", "output_cost_per_image": 0.05}, "flux-pro-1.1" : {"mode": "image_generation", "provider": "black_forest_labs", "base_model": "flux-pro-1.1", "output_cost_per_image": 0.04}, "flux-pro-1.1-ultra" : {"mode": "image_generation", "provider": "black_forest_labs", "base_model": "flux-pro-1.1-ultra", "output_cost_per_image": 0.06}, "flux-pro/v1.1" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux-pro/v1.1", "output_cost_per_image": 0.052}, "flux-pro/v1.1-ultra" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux-pro/v1.1-ultra", "output_cost_per_image": 0.063}, "flux-realism" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux-realism", "output_cost_per_image": 0.046}, "flux.2-pro" : {"mode": "image_generation", "provider": "azure", "base_model": "flux.2-pro", "output_cost_per_image": 0.04}, "flux/dev" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux/dev", "output_cost_per_image": 0.033}, "flux/kontext-max/text-to-image" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux/kontext-max/text-to-image", "output_cost_per_image": 0.104}, "flux/kontext-pro/text-to-image" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux/kontext-pro/text-to-image", "output_cost_per_image": 0.052}, "flux/schnell" : {"mode": "image_generation", "provider": "aiml", "base_model": "flux/schnell", "output_cost_per_image": 0.004}, "ft:babbage-002" : {"mode": "completion", "provider": "text-completion-openai", "base_model": "babbage-002", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000016, "output_cost_per_token": 0.0000016, "input_cost_per_token_batches": 0.0000002, "output_cost_per_token_batches": 0.0000002}, "ft:davinci-002" : {"mode": "completion", "provider": "text-completion-openai", "base_model": "davinci-002", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.000012, "output_cost_per_token": 0.000012, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000001}, "ft:gpt-3.5-turbo" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006, "input_cost_per_token_batches": 0.0000015, "output_cost_per_token_batches": 0.000003}, "ft:gpt-3.5-turbo-0125" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006}, "ft:gpt-3.5-turbo-0613" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006}, "ft:gpt-3.5-turbo-1106" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006}, "ft:gpt-4-0613" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006}, "ft:gpt-4.1-2025-04-14" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4.1", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.00000075, "input_cost_per_token_batches": 0.0000015, "output_cost_per_token_batches": 0.000006}, "ft:gpt-4.1-mini-2025-04-14" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4.1-mini", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032, "cache_read_input_token_cost": 0.0000002, "input_cost_per_token_batches": 0.0000004, "output_cost_per_token_batches": 0.0000016}, "ft:gpt-4.1-nano-2025-04-14" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4.1-nano", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000008, "cache_read_input_token_cost": 0.00000005, "input_cost_per_token_batches": 0.0000001, "output_cost_per_token_batches": 0.0000004}, "ft:gpt-4o-2024-08-06" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000375, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.000001875, "input_cost_per_token_batches": 0.000001875, "output_cost_per_token_batches": 0.0000075}, "ft:gpt-4o-2024-11-20" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000375, "output_cost_per_token": 0.000015, "cache_creation_input_token_cost": 0.000001875}, "ft:gpt-4o-mini-2024-07-18" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000015, "input_cost_per_token_batches": 0.00000015, "output_cost_per_token_batches": 0.0000006}, "ft:o4-mini-2025-04-16" : {"mode": "chat", "provider": "openai", "base_model": "o4-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000016, "cache_read_input_token_cost": 0.000001, "input_cost_per_token_batches": 0.000002, "output_cost_per_token_batches": 0.000008}, "gemini-1.5-flash" : {"mode": "embedding", "provider": "gemini", "base_model": "gemini-1.5-flash", "max_input_tokens": 8192, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0.00000015}, "gemini-2.0-flash" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.0-flash", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "input_cost_per_audio_token": 0.0000007, "cache_read_input_token_cost": 0.000000025}, "gemini-2.0-flash-001" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-2.0-flash", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.0000000375}, "gemini-2.0-flash-exp-image-generation" : {"mode": "image_generation", "provider": "gemini", "base_model": "gemini-2.0-flash-exp-image-generation", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_image": 0.039, "output_cost_per_token": 0}, "gemini-2.0-flash-lite" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-2.0-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003, "input_cost_per_audio_token": 0.000000075, "cache_read_input_token_cost": 0.00000001875}, "gemini-2.0-flash-lite-001" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.0-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003, "input_cost_per_audio_token": 0.000000075, "cache_read_input_token_cost": 0.00000001875}, "gemini-2.5-computer-use-preview-10-2025" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-2.5-computer-use", "max_input_tokens": 128000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "input_cost_per_token_above_200k_tokens": 0.0000025, "output_cost_per_token_above_200k_tokens": 0.000015}, "gemini-2.5-flash" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-flash", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.00000003}, "gemini-2.5-flash-image" : {"mode": "image_generation", "provider": "gemini", "base_model": "gemini-2.5-flash-image", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000003, "output_cost_per_image": 0.039, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.00000003, "output_cost_per_image_token": 0.00003}, "gemini-2.5-flash-lite" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-2.5-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "input_cost_per_audio_token": 0.0000003, "cache_read_input_token_cost": 0.00000001}, "gemini-2.5-flash-lite-preview-06-17" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-2.5-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "input_cost_per_audio_token": 0.0000005, "cache_read_input_token_cost": 0.000000025}, "gemini-2.5-flash-lite-preview-09-2025" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "input_cost_per_audio_token": 0.0000003, "cache_read_input_token_cost": 0.00000001}, "gemini-2.5-flash-native-audio-latest" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-flash-native-audio", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001}, "gemini-2.5-flash-native-audio-preview-09-2025" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-flash-native-audio", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001}, "gemini-2.5-flash-native-audio-preview-12-2025" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-flash-native-audio", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001}, "gemini-2.5-flash-preview-09-2025" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-flash", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.000000075}, "gemini-2.5-flash-preview-tts" : {"mode": "audio_speech", "provider": "gemini", "base_model": "gemini-2.5-flash-tts", "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025}, "gemini-2.5-pro" : {"mode": "chat", "provider": "github_copilot", "base_model": "gemini-2.5-pro", "max_input_tokens": 128000, "max_output_tokens": 64000}, "gemini-2.5-pro-preview-tts" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-2.5-pro-tts", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.0000007, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_above_200k_tokens": 0.0000025, "output_cost_per_token_above_200k_tokens": 0.000015, "cache_read_input_token_cost_above_200k_tokens": 0.00000025}, "gemini-3-flash-preview" : {"mode": "chat", "provider": "github_copilot", "base_model": "gemini-3-flash", "max_input_tokens": 128000, "max_output_tokens": 64000}, "gemini-3-pro-image-preview" : {"mode": "image_generation", "provider": "vertex", "base_model": "gemini-3-pro-image", "max_input_tokens": 65536, "max_output_tokens": 32768, "input_cost_per_image": 0.0011, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.134, "output_cost_per_token": 0.000012, "output_cost_per_image_token": 0.00012, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000006}, "gemini-3-pro-preview" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-3-pro", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "input_cost_per_token_batches": 0.000001, "input_cost_per_token_priority": 0.0000036, "output_cost_per_token_batches": 0.000006, "output_cost_per_token_priority": 0.0000216, "cache_read_input_token_cost_priority": 0.00000036, "input_cost_per_token_above_200k_tokens": 0.000004, "output_cost_per_token_above_200k_tokens": 0.000018, "cache_read_input_token_cost_above_200k_tokens": 0.0000004, "input_cost_per_token_above_200k_tokens_priority": 0.0000072, "output_cost_per_token_above_200k_tokens_priority": 0.0000324, "cache_read_input_token_cost_above_200k_tokens_priority": 0.00000072}, "gemini-3.1-flash-image-preview" : {"mode": "image_generation", "provider": "vertex", "base_model": "gemini-3.1-flash-image", "max_input_tokens": 65536, "max_output_tokens": 32768, "input_cost_per_image": 0.00056, "input_cost_per_token": 0.0000005, "output_cost_per_image": 0.0672, "output_cost_per_token": 0.000003, "output_cost_per_image_token": 0.00006}, "gemini-3.1-flash-lite" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-3.1-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000027, "input_cost_per_audio_token": 0.0000009, "cache_read_input_token_cost": 0.000000045}, "gemini-3.1-flash-lite-preview" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-3.1-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.0000015, "input_cost_per_audio_token": 0.0000005, "cache_read_input_token_cost": 0.000000025}, "gemini-3.1-flash-live-preview" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-3.1-flash-live", "max_input_tokens": 131072, "max_output_tokens": 65536, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.0000045, "input_cost_per_audio_token": 0.000003, "input_cost_per_image_token": 0.000001, "output_cost_per_audio_token": 0.000012, "input_cost_per_video_per_second": 0.000033333333333333335}, "gemini-3.1-pro-preview" : {"mode": "chat", "provider": "github_copilot", "base_model": "gemini-3.1-pro", "max_input_tokens": 128000, "max_output_tokens": 64000}, "gemini-3.1-pro-preview-customtools" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-3.1-pro-customtools", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.00012, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "input_cost_per_token_batches": 0.000001, "input_cost_per_token_priority": 0.0000036, "output_cost_per_token_batches": 0.000006, "output_cost_per_token_priority": 0.0000216, "cache_read_input_token_cost_priority": 0.00000036, "input_cost_per_token_above_200k_tokens": 0.000004, "output_cost_per_token_above_200k_tokens": 0.000018, "cache_read_input_token_cost_above_200k_tokens": 0.0000004, "input_cost_per_token_above_200k_tokens_priority": 0.0000072, "output_cost_per_token_above_200k_tokens_priority": 0.0000324, "cache_creation_input_token_cost_above_200k_tokens": 0.00000025, "cache_read_input_token_cost_above_200k_tokens_priority": 0.00000072}, "gemini-3.5-flash" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-3.5-flash", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000009, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.00000015, "input_cost_per_token_priority": 0.0000027, "output_cost_per_token_priority": 0.0000162, "cache_read_input_token_cost_priority": 0.00000027}, "gemini-embedding-001" : {"mode": "embedding", "provider": "vertex", "base_model": "gemini-embedding-001", "max_input_tokens": 2048, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0}, "gemini-embedding-2" : {"mode": "embedding", "provider": "vertex", "base_model": "gemini-embedding-2", "max_input_tokens": 8192, "input_cost_per_image": 0.00012, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0, "input_cost_per_audio_per_second": 0.00016, "input_cost_per_video_per_second": 0.00079}, "gemini-embedding-2-preview" : {"mode": "embedding", "provider": "gemini", "base_model": "gemini-embedding-2", "max_input_tokens": 8192, "input_cost_per_image": 0.00012, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0, "input_cost_per_audio_per_second": 0.00016, "input_cost_per_video_per_second": 0.00079}, "gemini-exp-1114" : {"mode": "chat", "provider": "gemini", "base_model": "gemini", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token_above_128k_tokens": 0}, "gemini-exp-1206" : {"mode": "chat", "provider": "gemini", "base_model": "gemini", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.00000003}, "gemini-flash-experimental" : {"mode": "embedding", "provider": "vertex", "base_model": "gemini-flash", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0, "input_cost_per_character": 0}, "gemini-flash-latest" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-flash", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0.000000075}, "gemini-flash-lite-latest" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "input_cost_per_audio_token": 0.0000003, "cache_read_input_token_cost": 0.000000025}, "gemini-gemma-2-27b-it" : {"mode": "chat", "provider": "gemini", "base_model": "gemma-2-27b-it", "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000105}, "gemini-gemma-2-9b-it" : {"mode": "chat", "provider": "gemini", "base_model": "gemma-2-9b-it", "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000105}, "gemini-live-2.5-flash-preview-native-audio-09-2025" : {"mode": "realtime", "provider": "vertex", "base_model": "gemini-live-2.5-flash-native-audio", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.000002, "input_cost_per_audio_token": 0.000003, "cache_read_input_token_cost": 0.000000075, "output_cost_per_audio_token": 0.000012}, "gemini-pro-latest" : {"mode": "chat", "provider": "gemini", "base_model": "gemini-pro", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_above_200k_tokens": 0.0000025, "output_cost_per_token_above_200k_tokens": 0.000015, "cache_read_input_token_cost_above_200k_tokens": 0.00000025}, "gemini-robotics-er-1.5-preview" : {"mode": "chat", "provider": "vertex", "base_model": "gemini-robotics-er-1.5", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.000001, "cache_read_input_token_cost": 0}, "gemma-3-27b-it" : {"mode": "chat", "provider": "gemini", "base_model": "gemma-3-27b-it", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_image": 0, "input_cost_per_token": 0, "output_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_video_per_second": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0}, "gemma-4-26b-a4b-it" : {"mode": "chat", "provider": "vertex", "base_model": "gemma-4", "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000034000000000000003}, "gemma-4-26b-a4b-it-maas" : {"mode": "chat", "provider": "vertex", "base_model": "gemma-4", "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000034000000000000003}, "gemma-4-31b" : {"mode": "chat", "provider": "vertex", "base_model": "gemma-4", "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "gemma-7b" : {"mode": "chat", "provider": "snowflake", "base_model": "gemma-7b", "max_input_tokens": 8000, "max_output_tokens": 8192}, "gemma-7b-it" : {"mode": "chat", "provider": "groq", "base_model": "gemma-7b-it", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008}, "gemma3-4b" : {"mode": "chat", "provider": "llamagate", "base_model": "gemma-3-4b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000008}, "gen3a_turbo" : {"mode": "video_generation", "provider": "runway", "base_model": "gen3a-turbo", "output_cost_per_video_per_second": 0.05}, "gen4_aleph" : {"mode": "video_generation", "provider": "runway", "base_model": "gen4-aleph", "output_cost_per_video_per_second": 0.15}, "gen4_image" : {"mode": "image_generation", "provider": "runway", "base_model": "gen4-image", "input_cost_per_image": 0.05, "output_cost_per_image": 0.05}, "gen4_image_turbo" : {"mode": "image_generation", "provider": "runway", "base_model": "gen4-image-turbo", "input_cost_per_image": 0.02, "output_cost_per_image": 0.02}, "gen4_turbo" : {"mode": "video_generation", "provider": "runway", "base_model": "gen4-turbo", "output_cost_per_video_per_second": 0.05}, "generative" : {"mode": "audio_speech", "provider": "aws_polly", "base_model": "generative", "input_cost_per_character": 0.00003}, "glm-4-32b-0414-128k" : {"mode": "chat", "provider": "zai", "base_model": "glm-4-32b-0414-128k", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "glm-4-7-251222" : {"mode": "chat", "provider": "volcengine", "base_model": "glm-4-7", "max_input_tokens": 204800, "max_output_tokens": 131072, "input_cost_per_token": 0, "output_cost_per_token": 0}, "glm-4.5" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.5", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022}, "glm-4.5-air" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.5-air", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000011}, "glm-4.5-airx" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.5-airx", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000045}, "glm-4.5-flash" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.5-flash", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "glm-4.5-x" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.5-x", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000022, "output_cost_per_token": 0.0000089}, "glm-4.5v" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.5v", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000018}, "glm-4.6" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.6", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0}, "glm-4.7" : {"mode": "chat", "provider": "zai", "base_model": "glm-4.7", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0}, "glm-4p7" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-4.7", "max_input_tokens": 202800, "max_output_tokens": 202800, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.0000003}, "glm-5" : {"mode": "chat", "provider": "zai", "base_model": "glm-5", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.0000032, "cache_read_input_token_cost": 0.0000002, "cache_creation_input_token_cost": 0}, "glm-5-code" : {"mode": "chat", "provider": "zai", "base_model": "glm-5-code", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0}, "glm-5p1" : {"mode": "chat", "provider": "fireworks", "base_model": "glm-5.1", "max_input_tokens": 202800, "max_output_tokens": 202800, "input_cost_per_token": 0.0000014, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000026}, "global-standard/gpt-4o-2024-08-06" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "global-standard/gpt-4o-2024-11-20" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "global-standard/gpt-4o-mini" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "global.amazon.nova-2-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-lite", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.000000075}, "global.anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125, "cache_creation_input_token_cost_above_1hr": 0.000002}, "global.anthropic.claude-opus-4-5-20251101-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "global.anthropic.claude-opus-4-6-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "global.anthropic.claude-opus-4-7" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "global.anthropic.claude-opus-4-8" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "global.anthropic.claude-sonnet-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "global.anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_creation_input_token_cost_above_1hr": 0.000006, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075, "cache_creation_input_token_cost_above_1hr_above_200k_tokens": 0.000012}, "global.anthropic.claude-sonnet-4-6" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "global/gpt-4o-2024-08-06" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "global/gpt-4o-2024-11-20" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "global/gpt-5.1" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "global/gpt-5.1-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "global/gpt-5.1-codex" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "global/gpt-5.1-codex-mini" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.000000025}, "global/grok-3" : {"mode": "chat", "provider": "azure", "base_model": "grok-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "global/grok-3-mini" : {"mode": "chat", "provider": "azure", "base_model": "grok-3-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000127}, "google.gemini-2.5-flash" : {"mode": "chat", "provider": "oci", "base_model": "gemini-2.5-flash", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "google.gemini-2.5-flash-lite" : {"mode": "chat", "provider": "oci", "base_model": "gemini-2.5-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003}, "google.gemini-2.5-pro" : {"mode": "chat", "provider": "oci", "base_model": "gemini-2.5-pro", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001}, "google.gemma-3-12b-it" : {"mode": "chat", "provider": "bedrock", "base_model": "gemma-3-12b-it", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000029}, "google.gemma-3-27b-it" : {"mode": "chat", "provider": "bedrock", "base_model": "gemma-3-27b-it", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000023, "output_cost_per_token": 0.00000038}, "google.gemma-3-4b-it" : {"mode": "chat", "provider": "bedrock", "base_model": "gemma-3-4b-it", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000008}, "google/chirp-3" : {"mode": "chat", "provider": "openrouter", "base_model": "chirp-3", "max_input_tokens": 0, "input_cost_per_token": 0.016}, "google/flan-t5-xl-3b" : {"mode": "chat", "provider": "watsonx", "base_model": "flan-t5-xl-3b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "google/gemini-2.0-flash" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "gemini-2.0-flash", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "google/gemini-2.0-flash-001" : {"mode": "chat", "provider": "deepinfra", "base_model": "gemini-2.0-flash", "max_input_tokens": 1000000, "max_output_tokens": 1000000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004}, "google/gemini-2.0-flash-lite" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "gemini-2.0-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003}, "google/gemini-2.5-flash" : {"mode": "chat", "provider": "deepinfra", "base_model": "gemini-2.5-flash", "max_input_tokens": 1000000, "max_output_tokens": 1000000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000025}, "google/gemini-2.5-flash-image" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-2.5-flash-image", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000003, "output_cost_per_image": 0.0000003, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.00000008333333333333334}, "google/gemini-2.5-flash-lite" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-2.5-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000001, "output_cost_per_image": 0.0000001, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.00000001, "cache_creation_input_token_cost": 0.00000008333333333333334}, "google/gemini-2.5-flash-lite-preview-09-2025" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-2.5-flash-lite-preview-09-2025", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.0000001, "output_cost_per_image": 0.0000001, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.00000001, "cache_creation_input_token_cost": 0.00000008333333333333334}, "google/gemini-2.5-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-2.5-pro", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.00000125, "output_cost_per_image": 0.00000125, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.0000007, "cache_read_input_token_cost": 0.000000125, "cache_creation_input_token_cost": 0.000000375}, "google/gemini-2.5-pro-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-2.5-pro-preview", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000125, "output_cost_per_image": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "cache_creation_input_token_cost": 0.000000375}, "google/gemini-2.5-pro-preview-05-06" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-2.5-pro-preview-05-06", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.00000125, "output_cost_per_image": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "cache_creation_input_token_cost": 0.000000375}, "google/gemini-3-flash-preview" : {"mode": "chat", "provider": "gmi", "base_model": "gemini-3-flash", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.000003}, "google/gemini-3-pro" : {"mode": "chat", "provider": "replicate", "base_model": "gemini-3-pro", "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000012}, "google/gemini-3-pro-image-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3-pro-image-preview", "max_input_tokens": 65536, "max_output_tokens": 32768, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.000002, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "cache_creation_input_token_cost": 0.000000375}, "google/gemini-3-pro-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3-pro", "max_input_tokens": 1048576, "max_output_tokens": 65535, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000006, "input_cost_per_token_above_200k_tokens": 0.000004, "output_cost_per_token_above_200k_tokens": 0.000018, "cache_read_input_token_cost_above_200k_tokens": 0.0000004, "cache_creation_input_token_cost_above_200k_tokens": 0.00000025}, "google/gemini-3.1-flash-image-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.1-flash-image-preview", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.000003}, "google/gemini-3.1-flash-lite" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.1-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000025, "output_cost_per_image": 0.00000025, "output_cost_per_token": 0.0000015, "input_cost_per_audio_token": 0.0000005, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.00000008333333333333334}, "google/gemini-3.1-flash-lite-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.1-flash-lite", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.00000025, "output_cost_per_image": 0.00000025, "output_cost_per_token": 0.0000015, "input_cost_per_audio_token": 0.0000005, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.00000008333333333333334}, "google/gemini-3.1-flash-tts-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.1-flash-tts-preview", "max_input_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.00002}, "google/gemini-3.1-pro-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.1-pro", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.000002, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "cache_creation_input_token_cost": 0.000000375, "input_cost_per_token_above_200k_tokens": 0.000004, "output_cost_per_token_above_200k_tokens": 0.000018, "cache_read_input_token_cost_above_200k_tokens": 0.0000004, "cache_creation_input_token_cost_above_200k_tokens": 0.00000025}, "google/gemini-3.1-pro-preview-customtools" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.1-pro-preview-customtools", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.000002, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "cache_creation_input_token_cost": 0.000000375}, "google/gemini-3.5-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-3.5-flash", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.0000015, "output_cost_per_image": 0.0000015, "output_cost_per_token": 0.000009, "cache_read_input_token_cost": 0.00000015, "cache_creation_input_token_cost": 0.00000008333333333333334}, "google/gemini-embedding-001" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-embedding-001", "max_input_tokens": 20000, "input_cost_per_token": 0.00000015}, "google/gemini-embedding-2" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-embedding-2", "max_input_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_image": 0.00000045}, "google/gemini-embedding-2-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-embedding-2-preview", "max_input_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_image": 0.00000045}, "google/gemma-2-27b-it" : {"mode": "chat", "provider": "openrouter", "base_model": "gemma-2-27b-it", "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000065}, "google/gemma-2-9b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "gemma-2-9b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "google/gemma-3-12b-it" : {"mode": "chat", "provider": "openrouter", "base_model": "gemma-3-12b-it", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000013}, "google/gemma-3-27b-it" : {"mode": "chat", "provider": "novita", "base_model": "gemma-3-27b-it", "max_input_tokens": 98304, "max_output_tokens": 16384, "input_cost_per_token": 0.000000119, "output_cost_per_token": 0.0000002}, "google/gemma-3-4b-it" : {"mode": "chat", "provider": "deepinfra", "base_model": "gemma-3-4b-it", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000008}, "google/gemma-3n-e4b-it" : {"mode": "chat", "provider": "openrouter", "base_model": "gemma-3n-e4b-it", "max_input_tokens": 32768, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000012}, "google/gemma-4-26b-a4b-it" : {"mode": "chat", "provider": "openrouter", "base_model": "gemma-4-26b-a4b-it", "max_input_tokens": 262144, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000033}, "google/gemma-4-26b-a4b-it-maas" : {"mode": "chat", "provider": "vertex", "base_model": "gemma-4", "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000034000000000000003}, "google/gemma-4-31b-it" : {"mode": "chat", "provider": "openrouter", "base_model": "gemma-4-31b-it", "max_input_tokens": 256000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.00000036, "cache_read_input_token_cost": 0.00000009}, "google/gemma-7b-it" : {"mode": "chat", "provider": "anyscale", "base_model": "gemma-7b-it", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "google/imagen-3" : {"mode": "image_generation", "provider": "replicate", "base_model": "imagen-3", "output_cost_per_image": 0.05}, "google/imagen-3-fast" : {"mode": "image_generation", "provider": "replicate", "base_model": "imagen-3-fast", "output_cost_per_image": 0.025}, "google/imagen-4" : {"mode": "image_generation", "provider": "replicate", "base_model": "imagen-4", "output_cost_per_image": 0.04}, "google/imagen-4-fast" : {"mode": "image_generation", "provider": "replicate", "base_model": "imagen-4-fast", "output_cost_per_image": 0.02}, "google/imagen-4-ultra" : {"mode": "image_generation", "provider": "replicate", "base_model": "imagen-4-ultra", "output_cost_per_image": 0.06}, "google/imagen-4.0-ultra-generate-001" : {"mode": "image_generation", "provider": "aiml", "base_model": "imagen-4.0-ultra-generate", "output_cost_per_image": 0.078}, "google/nano-banana" : {"mode": "image_generation", "provider": "replicate", "base_model": "nano-banana", "output_cost_per_image": 0.039}, "google/nano-banana-pro" : {"mode": "image_generation", "provider": "replicate", "base_model": "nano-banana-pro", "output_cost_per_image": 0.15, "output_cost_per_image_above_1024_and_1024_pixels": 0.15, "output_cost_per_image_above_2048_and_2048_pixels": 0.15, "output_cost_per_image_above_4096_and_4096_pixels": 0.3}, "google/text-embedding-005" : {"mode": "embedding", "provider": "vercel_ai_gateway", "base_model": "text-embedding-005", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.000000025, "output_cost_per_token": 0}, "google/text-multilingual-embedding-002" : {"mode": "embedding", "provider": "vercel_ai_gateway", "base_model": "text-multilingual-embedding-002", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.000000025, "output_cost_per_token": 0}, "google/veo-2" : {"mode": "video_generation", "provider": "replicate", "base_model": "veo-2", "output_cost_per_video_per_second": 0.5}, "google/veo-3" : {"mode": "video_generation", "provider": "replicate", "base_model": "veo-3", "output_cost_per_video_per_second": 0.75}, "google/veo-3-fast" : {"mode": "video_generation", "provider": "replicate", "base_model": "veo-3-fast", "output_cost_per_video_per_second": 0.4}, "google/veo-3.1" : {"mode": "video_generation", "provider": "replicate", "base_model": "veo-3.1", "output_cost_per_video_per_second": 0.75}, "google/veo-3.1-fast" : {"mode": "video_generation", "provider": "replicate", "base_model": "veo-3.1-fast", "output_cost_per_video_per_second": 0.4}, "gpt-3.5-turbo" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "gpt-3.5-turbo-0125" : {"mode": "chat", "provider": "azure", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "gpt-3.5-turbo-0613" : {"mode": "chat", "provider": "github_copilot", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16384, "max_output_tokens": 4096}, "gpt-3.5-turbo-1106" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002}, "gpt-3.5-turbo-16k" : {"mode": "chat", "provider": "openai", "base_model": "gpt-3.5-turbo-16k", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004}, "gpt-3.5-turbo-instruct" : {"mode": "completion", "provider": "text-completion-openai", "base_model": "gpt-3.5-turbo-instruct", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002}, "gpt-3.5-turbo-instruct-0914" : {"mode": "completion", "provider": "text-completion-openai", "base_model": "gpt-3.5-turbo-instruct", "max_input_tokens": 8192, "max_output_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002}, "gpt-35-turbo" : {"mode": "chat", "provider": "azure", "base_model": "gpt-3.5-turbo", "max_input_tokens": 4097, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "gpt-35-turbo-0125" : {"mode": "chat", "provider": "azure", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "gpt-35-turbo-1106" : {"mode": "chat", "provider": "azure", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002}, "gpt-35-turbo-16k" : {"mode": "chat", "provider": "azure", "base_model": "gpt-3.5-turbo-16k", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004}, "gpt-35-turbo-16k-0613" : {"mode": "chat", "provider": "azure", "base_model": "gpt-3.5-turbo-16k", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004}, "gpt-35-turbo-instruct" : {"mode": "completion", "provider": "azure_text", "base_model": "gpt-3.5-turbo-instruct", "max_input_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002}, "gpt-35-turbo-instruct-0914" : {"mode": "completion", "provider": "azure_text", "base_model": "gpt-3.5-turbo-instruct", "max_input_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002}, "gpt-4" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006}, "gpt-4-0125-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "gpt-4-0314" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006}, "gpt-4-0613" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006}, "gpt-4-1106-preview" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "gpt-4-32k" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4-32k", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012}, "gpt-4-32k-0613" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4-32k", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012}, "gpt-4-o-preview" : {"mode": "chat", "provider": "github_copilot", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 4096}, "gpt-4-turbo" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4-turbo", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "gpt-4-turbo-2024-04-09" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4-turbo", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "gpt-4-turbo-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4-turbo", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "gpt-4-turbo-vision-preview" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4-turbo-vision", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "gpt-4.1" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.1", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000004}, "gpt-4.1-2025-04-14" : {"mode": "chat", "provider": "github_copilot", "base_model": "gpt-4.1", "max_input_tokens": 128000, "max_output_tokens": 16384}, "gpt-4.1-mini" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.1-mini", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016, "cache_read_input_token_cost": 0.0000001, "input_cost_per_token_batches": 0.0000002, "output_cost_per_token_batches": 0.0000008}, "gpt-4.1-mini-2025-04-14" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4.1-mini", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016, "cache_read_input_token_cost": 0.0000001, "input_cost_per_token_batches": 0.0000002, "output_cost_per_token_batches": 0.0000008}, "gpt-4.1-nano" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4.1-nano", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.000000025, "input_cost_per_token_batches": 0.00000005, "input_cost_per_token_priority": 0.0000002, "output_cost_per_token_batches": 0.0000002, "output_cost_per_token_priority": 0.0000008, "cache_read_input_token_cost_priority": 0.00000005}, "gpt-4.1-nano-2025-04-14" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.1-nano", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.000000025, "input_cost_per_token_batches": 0.00000005, "output_cost_per_token_batches": 0.0000002}, "gpt-4.5-preview" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.5", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.000075, "output_cost_per_token": 0.00015, "cache_read_input_token_cost": 0.0000375, "input_cost_per_token_batches": 0.0000375, "output_cost_per_token_batches": 0.000075}, "gpt-41-copilot" : {"mode": "chat", "provider": "github_copilot", "base_model": "gpt-41-copilot"}, "gpt-4o" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125, "input_cost_per_token_batches": 0.00000125, "input_cost_per_token_priority": 0.00000425, "output_cost_per_token_batches": 0.000005, "output_cost_per_token_priority": 0.000017, "cache_read_input_token_cost_priority": 0.000002125}, "gpt-4o-2024-05-13" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "input_cost_per_token_batches": 0.0000025, "input_cost_per_token_priority": 0.00000875, "output_cost_per_token_batches": 0.0000075, "output_cost_per_token_priority": 0.00002625}, "gpt-4o-2024-08-06" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125, "input_cost_per_token_batches": 0.00000125, "output_cost_per_token_batches": 0.000005}, "gpt-4o-2024-11-20" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000125}, "gpt-4o-audio-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.00004, "output_cost_per_audio_token": 0.00008}, "gpt-4o-audio-preview-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.00004, "output_cost_per_audio_token": 0.00008}, "gpt-4o-audio-preview-2025-06-03" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.00004, "output_cost_per_audio_token": 0.00008}, "gpt-4o-mini" : {"mode": "chat", "provider": "github_copilot", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 4096}, "gpt-4o-mini-2024-07-18" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000075, "input_cost_per_token_batches": 0.000000075, "output_cost_per_token_batches": 0.0000003}, "gpt-4o-mini-audio-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "input_cost_per_audio_token": 0.00001, "output_cost_per_audio_token": 0.00002}, "gpt-4o-mini-audio-preview-2024-12-17" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "input_cost_per_audio_token": 0.00001, "output_cost_per_audio_token": 0.00002}, "gpt-4o-mini-realtime-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "cache_read_input_token_cost": 0.0000003, "output_cost_per_audio_token": 0.00002, "cache_creation_input_audio_token_cost": 0.0000003}, "gpt-4o-mini-realtime-preview-2024-12-17" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "cache_read_input_token_cost": 0.0000003, "output_cost_per_audio_token": 0.00002, "cache_creation_input_audio_token_cost": 0.0000003}, "gpt-4o-mini-search-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini-search", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000075, "input_cost_per_token_batches": 0.000000075, "output_cost_per_token_batches": 0.0000003}, "gpt-4o-mini-search-preview-2025-03-11" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-mini-search", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000075, "input_cost_per_token_batches": 0.000000075, "output_cost_per_token_batches": 0.0000003}, "gpt-4o-mini-transcribe" : {"mode": "audio_transcription", "provider": "azure", "base_model": "gpt-4o-mini-transcribe", "max_input_tokens": 16000, "max_output_tokens": 2000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.000005, "input_cost_per_audio_token": 0.00000125}, "gpt-4o-mini-transcribe-2025-03-20" : {"mode": "audio_transcription", "provider": "openai", "base_model": "gpt-4o-mini-transcribe", "max_input_tokens": 16000, "max_output_tokens": 2000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.000005, "input_cost_per_audio_token": 0.00000125}, "gpt-4o-mini-transcribe-2025-12-15" : {"mode": "audio_transcription", "provider": "openai", "base_model": "gpt-4o-mini-transcribe", "max_input_tokens": 16000, "max_output_tokens": 2000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.000005, "input_cost_per_audio_token": 0.00000125}, "gpt-4o-mini-tts" : {"mode": "audio_speech", "provider": "azure", "base_model": "gpt-4o-mini-tts", "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "output_cost_per_second": 0.00025, "output_cost_per_audio_token": 0.000012}, "gpt-4o-mini-tts-2025-03-20" : {"mode": "audio_speech", "provider": "openai", "base_model": "gpt-4o-mini-tts", "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "output_cost_per_second": 0.00025, "output_cost_per_audio_token": 0.000012}, "gpt-4o-mini-tts-2025-12-15" : {"mode": "audio_speech", "provider": "openai", "base_model": "gpt-4o-mini-tts", "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "output_cost_per_second": 0.00025, "output_cost_per_audio_token": 0.000012}, "gpt-4o-realtime-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00002, "input_cost_per_audio_token": 0.00004, "cache_read_input_token_cost": 0.0000025, "output_cost_per_audio_token": 0.00008}, "gpt-4o-realtime-preview-2024-10-01" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00002, "input_cost_per_audio_token": 0.0001, "cache_read_input_token_cost": 0.0000025, "output_cost_per_audio_token": 0.0002, "cache_creation_input_audio_token_cost": 0.00002}, "gpt-4o-realtime-preview-2024-12-17" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00002, "input_cost_per_audio_token": 0.00004, "cache_read_input_token_cost": 0.0000025, "output_cost_per_audio_token": 0.00008}, "gpt-4o-realtime-preview-2025-06-03" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00002, "input_cost_per_audio_token": 0.00004, "cache_read_input_token_cost": 0.0000025, "output_cost_per_audio_token": 0.00008}, "gpt-4o-search-preview" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-search", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125, "input_cost_per_token_batches": 0.00000125, "output_cost_per_token_batches": 0.000005}, "gpt-4o-search-preview-2025-03-11" : {"mode": "chat", "provider": "openai", "base_model": "gpt-4o-search", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125, "input_cost_per_token_batches": 0.00000125, "output_cost_per_token_batches": 0.000005}, "gpt-4o-transcribe" : {"mode": "audio_transcription", "provider": "openai", "base_model": "gpt-4o-transcribe", "max_input_tokens": 16000, "max_output_tokens": 2000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.0000025}, "gpt-4o-transcribe-diarize" : {"mode": "audio_transcription", "provider": "azure", "base_model": "gpt-4o-transcribe", "max_input_tokens": 16000, "max_output_tokens": 2000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.0000025}, "gpt-5" : {"mode": "chat", "provider": "github_copilot", "base_model": "gpt-5", "max_input_tokens": 128000, "max_output_tokens": 128000}, "gpt-5-2025-08-07" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "input_cost_per_token_flex": 0.000000625, "output_cost_per_token_flex": 0.000005, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_flex": 0.0000000625, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5-chat-latest" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5-codex" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5-mini" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.000000025}, "gpt-5-mini-2025-08-07" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "input_cost_per_token_flex": 0.000000125, "output_cost_per_token_flex": 0.000001, "cache_read_input_token_cost": 0.000000025, "input_cost_per_token_priority": 0.00000045, "output_cost_per_token_priority": 0.0000036, "cache_read_input_token_cost_flex": 0.0000000125, "cache_read_input_token_cost_priority": 0.000000045}, "gpt-5-nano" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.000000005}, "gpt-5-nano-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.000000005}, "gpt-5-pro" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5-pro", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00012}, "gpt-5-pro-2025-10-06" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5-pro", "max_input_tokens": 128000, "max_output_tokens": 272000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00012, "input_cost_per_token_batches": 0.0000075, "output_cost_per_token_batches": 0.00006}, "gpt-5-search-api" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5-search-api", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5-search-api-2025-10-14" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5-search-api", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5.1" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.1", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5.1-2025-11-13" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.1", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5.1-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5.1-chat-2025-11-13" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5.1-chat-latest" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5.1-codex" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5.1-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5.1-codex-2025-11-13" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125, "input_cost_per_token_priority": 0.0000025, "output_cost_per_token_priority": 0.00002, "cache_read_input_token_cost_priority": 0.00000025}, "gpt-5.1-codex-max" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5.1-codex-max", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "gpt-5.1-codex-mini" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.000000025}, "gpt-5.1-codex-mini-2025-11-13" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.000000025, "input_cost_per_token_priority": 0.00000045, "output_cost_per_token_priority": 0.0000036, "cache_read_input_token_cost_priority": 0.000000045}, "gpt-5.2" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.2", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175}, "gpt-5.2-2025-12-11" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.2", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.2-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.2-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.2-chat-2025-12-11" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.2-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.2-chat-latest" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.2-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.2-codex" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5.2-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.2-pro" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5.2-pro", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000021, "output_cost_per_token": 0.000168}, "gpt-5.2-pro-2025-12-11" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5.2-pro", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000021, "output_cost_per_token": 0.000168}, "gpt-5.3-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.3-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.3-chat-latest" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.3-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175, "input_cost_per_token_priority": 0.0000035, "output_cost_per_token_priority": 0.000028, "cache_read_input_token_cost_priority": 0.00000035}, "gpt-5.3-codex" : {"mode": "responses", "provider": "github_copilot", "base_model": "gpt-5.3-codex", "max_input_tokens": 400000, "max_output_tokens": 128000}, "gpt-5.3-codex-spark" : {"mode": "responses", "provider": "chatgpt", "base_model": "gpt-5.3-codex-spark", "max_input_tokens": 128000, "max_output_tokens": 128000}, "gpt-5.3-instant" : {"mode": "responses", "provider": "chatgpt", "base_model": "gpt-5.3-instant", "max_input_tokens": 128000, "max_output_tokens": 64000}, "gpt-5.4" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.4", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.00000025, "input_cost_per_token_priority": 0.000005, "output_cost_per_token_priority": 0.00003, "cache_read_input_token_cost_priority": 0.0000005, "input_cost_per_token_above_272k_tokens": 0.000005, "output_cost_per_token_above_272k_tokens": 0.0000225, "cache_read_input_token_cost_above_272k_tokens": 0.0000005, "input_cost_per_token_above_272k_tokens_priority": 0.00001, "output_cost_per_token_above_272k_tokens_priority": 0.000045, "cache_read_input_token_cost_above_272k_tokens_priority": 0.000001}, "gpt-5.4-2026-03-05" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.4", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000015, "input_cost_per_token_flex": 0.00000125, "output_cost_per_token_flex": 0.0000075, "cache_read_input_token_cost": 0.00000025, "input_cost_per_token_batches": 0.00000125, "input_cost_per_token_priority": 0.000005, "output_cost_per_token_batches": 0.0000075, "output_cost_per_token_priority": 0.00003, "cache_read_input_token_cost_flex": 0.00000013, "cache_read_input_token_cost_priority": 0.0000005, "input_cost_per_token_above_272k_tokens": 0.000005, "output_cost_per_token_above_272k_tokens": 0.0000225, "cache_read_input_token_cost_above_272k_tokens": 0.0000005}, "gpt-5.4-mini" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.4-mini", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.0000045, "cache_read_input_token_cost": 0.000000075}, "gpt-5.4-mini-2026-03-17" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.4-mini", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.0000045, "cache_read_input_token_cost": 0.000000075}, "gpt-5.4-nano" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.4-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000125, "input_cost_per_token_flex": 0.0000001, "output_cost_per_token_flex": 0.000000625, "cache_read_input_token_cost": 0.00000002, "input_cost_per_token_batches": 0.0000001, "output_cost_per_token_batches": 0.000000625, "cache_read_input_token_cost_flex": 0.00000001}, "gpt-5.4-nano-2026-03-17" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.4-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000125, "input_cost_per_token_flex": 0.0000001, "output_cost_per_token_flex": 0.000000625, "cache_read_input_token_cost": 0.00000002, "input_cost_per_token_batches": 0.0000001, "output_cost_per_token_batches": 0.000000625, "cache_read_input_token_cost_flex": 0.00000001}, "gpt-5.4-pro" : {"mode": "responses", "provider": "chatgpt", "base_model": "gpt-5.4-pro", "max_input_tokens": 1050000, "max_output_tokens": 128000}, "gpt-5.4-pro-2026-03-05" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.4-pro", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00018, "cache_read_input_token_cost": 0.000003, "input_cost_per_token_above_272k_tokens": 0.00006, "output_cost_per_token_above_272k_tokens": 0.00027, "cache_read_input_token_cost_above_272k_tokens": 0.000006}, "gpt-5.5" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.5", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00003, "input_cost_per_token_flex": 0.0000025, "output_cost_per_token_flex": 0.000015, "cache_read_input_token_cost": 0.0000005, "input_cost_per_token_batches": 0.0000025, "input_cost_per_token_priority": 0.00001, "output_cost_per_token_batches": 0.000015, "output_cost_per_token_priority": 0.00006, "cache_read_input_token_cost_flex": 0.00000025, "cache_read_input_token_cost_priority": 0.000001, "input_cost_per_token_above_272k_tokens": 0.00001, "output_cost_per_token_above_272k_tokens": 0.000045, "cache_read_input_token_cost_above_272k_tokens": 0.000001}, "gpt-5.5-2026-04-23" : {"mode": "chat", "provider": "openai", "base_model": "gpt-5.5", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00003, "input_cost_per_token_flex": 0.0000025, "output_cost_per_token_flex": 0.000015, "cache_read_input_token_cost": 0.0000005, "input_cost_per_token_batches": 0.0000025, "input_cost_per_token_priority": 0.00001, "output_cost_per_token_batches": 0.000015, "output_cost_per_token_priority": 0.00006, "cache_read_input_token_cost_flex": 0.00000025, "cache_read_input_token_cost_priority": 0.000001, "input_cost_per_token_above_272k_tokens": 0.00001, "output_cost_per_token_above_272k_tokens": 0.000045, "cache_read_input_token_cost_above_272k_tokens": 0.000001}, "gpt-5.5-codex" : {"mode": "responses", "provider": "openai", "base_model": "gpt-5.5-codex", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00003, "cache_read_input_token_cost": 0.0000005}, "gpt-5.5-pro" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.5-pro", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00018, "cache_read_input_token_cost": 0.000003, "input_cost_per_token_above_272k_tokens": 0.00006, "output_cost_per_token_above_272k_tokens": 0.00027, "cache_read_input_token_cost_above_272k_tokens": 0.000006}, "gpt-5.5-pro-2026-04-23" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.5-pro", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00018, "cache_read_input_token_cost": 0.000003, "input_cost_per_token_above_272k_tokens": 0.00006, "output_cost_per_token_above_272k_tokens": 0.00027, "cache_read_input_token_cost_above_272k_tokens": 0.000006}, "gpt-audio" : {"mode": "chat", "provider": "openai", "base_model": "gpt-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.000032, "output_cost_per_audio_token": 0.000064}, "gpt-audio-1.5" : {"mode": "chat", "provider": "openai", "base_model": "gpt-audio-1.5", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.000032, "output_cost_per_audio_token": 0.000064}, "gpt-audio-1.5-2026-02-23" : {"mode": "chat", "provider": "azure", "base_model": "gpt-audio-1.5", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.00004, "output_cost_per_audio_token": 0.00008}, "gpt-audio-2025-08-28" : {"mode": "chat", "provider": "azure", "base_model": "gpt-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "input_cost_per_audio_token": 0.00004, "output_cost_per_audio_token": 0.00008}, "gpt-audio-mini" : {"mode": "chat", "provider": "openai", "base_model": "gpt-audio-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "output_cost_per_audio_token": 0.00002}, "gpt-audio-mini-2025-10-06" : {"mode": "chat", "provider": "openai", "base_model": "gpt-audio-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "output_cost_per_audio_token": 0.00002}, "gpt-audio-mini-2025-12-15" : {"mode": "chat", "provider": "openai", "base_model": "gpt-audio-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "output_cost_per_audio_token": 0.00002}, "gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_token": 0.000005, "input_cost_per_image_token": 0.00001, "cache_read_input_token_cost": 0.00000125, "output_cost_per_image_token": 0.00004, "cache_read_input_image_token_cost": 0.0000025}, "gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_token": 0.000002, "input_cost_per_image_token": 0.0000025, "cache_read_input_token_cost": 0.0000002, "output_cost_per_image_token": 0.000008, "cache_read_input_image_token_cost": 0.00000025}, "gpt-image-1.5" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.013, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00001, "input_cost_per_image_token": 0.000008, "cache_read_input_token_cost": 0.00000125, "output_cost_per_image_token": 0.000032, "cache_read_input_image_token_cost": 0.000002}, "gpt-image-1.5-2025-12-16" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-1.5", "input_cost_per_image": 0.009, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00001, "input_cost_per_image_token": 0.000008, "cache_read_input_token_cost": 0.00000125, "output_cost_per_image_token": 0.000032, "cache_read_input_image_token_cost": 0.000002}, "gpt-image-2" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-2", "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00001, "input_cost_per_image_token": 0.000008, "cache_read_input_token_cost": 0.00000125, "output_cost_per_image_token": 0.00003, "cache_read_input_image_token_cost": 0.000002}, "gpt-image-2-2026-04-21" : {"mode": "image_generation", "provider": "openai", "base_model": "gpt-image-2", "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00001, "input_cost_per_image_token": 0.000008, "cache_read_input_token_cost": 0.00000125, "output_cost_per_image_token": 0.00003, "cache_read_input_image_token_cost": 0.000002}, "gpt-oss-120b" : {"mode": "chat", "provider": "cerebras", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000075}, "gpt-oss-120b-mxfp-GGUF" : {"mode": "chat", "provider": "lemonade", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "gpt-oss-20b" : {"mode": "chat", "provider": "ovhcloud", "base_model": "gpt-oss-20b", "max_input_tokens": 131000, "max_output_tokens": 131000, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000015}, "gpt-oss-20b-mxfp4-GGUF" : {"mode": "chat", "provider": "lemonade", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "gpt-oss:120b-cloud" : {"mode": "chat", "provider": "ollama", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0, "output_cost_per_token": 0}, "gpt-oss:20b-cloud" : {"mode": "chat", "provider": "ollama", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0, "output_cost_per_token": 0}, "gpt-realtime" : {"mode": "chat", "provider": "openai", "base_model": "gpt-realtime", "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_image": 0.000005, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000016, "input_cost_per_audio_token": 0.000032, "cache_read_input_token_cost": 0.0000004, "output_cost_per_audio_token": 0.000064, "cache_creation_input_audio_token_cost": 0.0000004}, "gpt-realtime-1.5" : {"mode": "chat", "provider": "openai", "base_model": "gpt-realtime-1.5", "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_image": 0.000005, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000016, "input_cost_per_audio_token": 0.000032, "cache_read_input_token_cost": 0.0000004, "output_cost_per_audio_token": 0.000064, "cache_creation_input_audio_token_cost": 0.0000004}, "gpt-realtime-1.5-2026-02-23" : {"mode": "chat", "provider": "azure", "base_model": "gpt-realtime-1.5", "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_image": 0.000005, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000016, "input_cost_per_audio_token": 0.000032, "cache_read_input_token_cost": 0.000004, "output_cost_per_audio_token": 0.000064, "cache_creation_input_audio_token_cost": 0.000004}, "gpt-realtime-2" : {"mode": "chat", "provider": "openai", "base_model": "gpt-realtime-2", "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_image": 0.000005, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000016, "input_cost_per_audio_token": 0.000032, "cache_read_input_token_cost": 0.0000004, "output_cost_per_audio_token": 0.000064, "cache_creation_input_audio_token_cost": 0.0000004}, "gpt-realtime-2025-08-28" : {"mode": "chat", "provider": "azure", "base_model": "gpt-realtime", "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_image": 0.000005, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000016, "input_cost_per_audio_token": 0.000032, "cache_read_input_token_cost": 0.000004, "output_cost_per_audio_token": 0.000064, "cache_creation_input_audio_token_cost": 0.000004}, "gpt-realtime-mini" : {"mode": "chat", "provider": "openai", "base_model": "gpt-realtime-mini", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "output_cost_per_audio_token": 0.00002, "cache_creation_input_audio_token_cost": 0.0000003}, "gpt-realtime-mini-2025-10-06" : {"mode": "chat", "provider": "azure", "base_model": "gpt-realtime-mini", "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_image": 0.0000008, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "cache_read_input_token_cost": 0.00000006, "output_cost_per_audio_token": 0.00002, "cache_creation_input_audio_token_cost": 0.0000003}, "gpt-realtime-mini-2025-12-15" : {"mode": "chat", "provider": "openai", "base_model": "gpt-realtime-mini", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_image": 0.0000008, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024, "input_cost_per_audio_token": 0.00001, "cache_read_input_token_cost": 0.00000006, "output_cost_per_audio_token": 0.00002, "cache_creation_input_audio_token_cost": 0.0000003}, "grok-2" : {"mode": "chat", "provider": "xai", "base_model": "grok-2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "grok-2-1212" : {"mode": "chat", "provider": "xai", "base_model": "grok-2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "grok-2-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "grok-2-vision" : {"mode": "chat", "provider": "xai", "base_model": "grok-2-vision", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_image": 0.000002, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "grok-2-vision-1212" : {"mode": "chat", "provider": "xai", "base_model": "grok-2-vision", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_image": 0.000002, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "grok-2-vision-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-2-vision", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_image": 0.000002, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "grok-3" : {"mode": "chat", "provider": "azure", "base_model": "grok-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "grok-3-beta" : {"mode": "chat", "provider": "xai", "base_model": "grok-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.00000075}, "grok-3-fast-beta" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.00000125}, "grok-3-fast-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.00000125}, "grok-3-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.00000075}, "grok-3-mini" : {"mode": "chat", "provider": "azure", "base_model": "grok-3-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000127}, "grok-3-mini-beta" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.000000075}, "grok-3-mini-fast" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-mini-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000015}, "grok-3-mini-fast-beta" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-mini-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000015}, "grok-3-mini-fast-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-mini-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000015}, "grok-3-mini-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-3-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.000000075}, "grok-4" : {"mode": "chat", "provider": "azure", "base_model": "grok-4", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "grok-4-0709" : {"mode": "chat", "provider": "xai", "base_model": "grok-4", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "input_cost_per_token_above_128k_tokens": 0.000006, "output_cost_per_token_above_128k_tokens": 0.00003}, "grok-4-1-fast" : {"mode": "chat", "provider": "xai", "base_model": "grok-4-1-fast", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.00000005, "input_cost_per_token_above_128k_tokens": 0.0000004, "output_cost_per_token_above_128k_tokens": 0.000001}, "grok-4-1-fast-non-reasoning" : {"mode": "chat", "provider": "azure", "base_model": "grok-4-1-fast-non", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005}, "grok-4-1-fast-non-reasoning-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-4-1-fast-non", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.00000005, "input_cost_per_token_above_128k_tokens": 0.0000004, "output_cost_per_token_above_128k_tokens": 0.000001}, "grok-4-1-fast-reasoning" : {"mode": "chat", "provider": "azure", "base_model": "grok-4-1-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005}, "grok-4-1-fast-reasoning-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-4-1-fast", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.00000005, "input_cost_per_token_above_128k_tokens": 0.0000004, "output_cost_per_token_above_128k_tokens": 0.000001}, "grok-4-fast-non-reasoning" : {"mode": "chat", "provider": "azure", "base_model": "grok-4-fast-non", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005}, "grok-4-fast-reasoning" : {"mode": "chat", "provider": "azure", "base_model": "grok-4-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005}, "grok-4-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-4", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "input_cost_per_token_above_128k_tokens": 0.000006, "output_cost_per_token_above_128k_tokens": 0.00003}, "grok-4.20-0309-reasoning" : {"mode": "chat", "provider": "xai", "base_model": "grok-4.20", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "grok-4.20-beta-0309-non-reasoning" : {"mode": "chat", "provider": "xai", "base_model": "grok-4.20-beta-0309-non", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "grok-4.20-beta-0309-reasoning" : {"mode": "chat", "provider": "xai", "base_model": "grok-4.20-beta", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "grok-4.20-multi-agent-beta-0309" : {"mode": "chat", "provider": "xai", "base_model": "grok-4.20-multi-agent", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "grok-4.3" : {"mode": "chat", "provider": "xai", "base_model": "grok-4.3", "max_input_tokens": 1000000, "max_output_tokens": 1000000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.0000002, "input_cost_per_token_above_200k_tokens": 0.0000025, "output_cost_per_token_above_200k_tokens": 0.000005, "cache_read_input_token_cost_above_200k_tokens": 0.0000004}, "grok-4.3-latest" : {"mode": "chat", "provider": "xai", "base_model": "grok-4.3", "max_input_tokens": 1000000, "max_output_tokens": 1000000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.0000002, "input_cost_per_token_above_200k_tokens": 0.0000025, "output_cost_per_token_above_200k_tokens": 0.000005, "cache_read_input_token_cost_above_200k_tokens": 0.0000004}, "grok-beta" : {"mode": "chat", "provider": "xai", "base_model": "grok", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015}, "grok-code-fast" : {"mode": "chat", "provider": "xai", "base_model": "grok-code-fast", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0.00000002}, "grok-code-fast-1" : {"mode": "chat", "provider": "xai", "base_model": "grok-code-fast-1", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0.00000002}, "grok-code-fast-1-0825" : {"mode": "chat", "provider": "xai", "base_model": "grok-code-fast-1", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0.00000002}, "grok-vision-beta" : {"mode": "chat", "provider": "xai", "base_model": "grok-vision", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_image": 0.000005, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015}, "gryphe/mythomax-l2-13b" : {"mode": "chat", "provider": "openrouter", "base_model": "mythomax-l2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001875, "output_cost_per_token": 0.000001875}, "hd/1024-x-1024/dall-e-3" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000007629, "output_cost_per_token": 0}, "hd/1024-x-1792/dall-e-3" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000006539, "output_cost_per_token": 0}, "hd/1792-x-1024/dall-e-3" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000006539, "output_cost_per_token": 0}, "hermes3-405b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "hermes3-405b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000008}, "hermes3-70b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "hermes3-70b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.0000003}, "hermes3-8b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "hermes3-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000025, "output_cost_per_token": 0.00000004}, "hexgrad/kokoro-82m" : {"mode": "chat", "provider": "openrouter", "base_model": "kokoro-82m", "max_input_tokens": 4096, "input_cost_per_token": 0.00000062}, "high/1024-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000159263611, "output_cost_per_pixel": 0}, "high/1024-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.00000003173828125, "output_cost_per_pixel": 0}, "high/1024-x-1536/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000158945719, "output_cost_per_pixel": 0}, "high/1024-x-1536/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.00000003173828125, "output_cost_per_pixel": 0}, "high/1536-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000158945719, "output_cost_per_pixel": 0}, "high/1536-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.000000031575520833, "output_cost_per_pixel": 0}, "ibm-granite/granite-3.3-8b-instruct" : {"mode": "chat", "provider": "replicate", "base_model": "granite-3.3-8b-instruct", "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000025}, "ibm-granite/granite-4.0-h-micro" : {"mode": "chat", "provider": "openrouter", "base_model": "granite-4.0-h-micro", "max_input_tokens": 131000, "max_output_tokens": 131000, "input_cost_per_token": 0.000000017, "output_cost_per_token": 0.000000112}, "ibm-granite/granite-4.1-8b" : {"mode": "chat", "provider": "openrouter", "base_model": "granite-4.1-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000001, "cache_read_input_token_cost": 0.00000005}, "ibm/granite-13b-chat-v2" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-13b-chat-v2", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "ibm/granite-13b-instruct-v2" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-13b-instruct-v2", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "ibm/granite-3-3-8b-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-3-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "ibm/granite-3-8b-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "ibm/granite-4-h-small" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-4-h-small", "max_input_tokens": 20480, "max_output_tokens": 20480, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000025}, "ibm/granite-guardian-3-2-2b" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-guardian-3-2-2b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "ibm/granite-guardian-3-3-8b" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-guardian-3-3-8b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "ibm/granite-ttm-1024-96-r2" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-ttm-1024-96-r2", "max_input_tokens": 512, "max_output_tokens": 512, "input_cost_per_token": 0.00000038, "output_cost_per_token": 0.00000038}, "ibm/granite-ttm-1536-96-r2" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-ttm-1536-96-r2", "max_input_tokens": 512, "max_output_tokens": 512, "input_cost_per_token": 0.00000038, "output_cost_per_token": 0.00000038}, "ibm/granite-ttm-512-96-r2" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-ttm-512-96-r2", "max_input_tokens": 512, "max_output_tokens": 512, "input_cost_per_token": 0.00000038, "output_cost_per_token": 0.00000038}, "ibm/granite-vision-3-2-2b" : {"mode": "chat", "provider": "watsonx", "base_model": "granite-vision-3-2-2b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "ideogram-ai/ideogram-v3-turbo" : {"mode": "image_generation", "provider": "replicate", "base_model": "ideogram-ai/ideogram-v3-turbo", "output_cost_per_image": 0.03}, "imagegeneration@006" : {"mode": "image_generation", "provider": "vertex", "base_model": "imagegeneration", "output_cost_per_image": 0.02}, "imagen-3.0-capability-001" : {"mode": "image_generation", "provider": "vertex", "base_model": "imagen-3.0-capability", "output_cost_per_image": 0.04}, "imagen-3.0-fast-generate-001" : {"mode": "image_generation", "provider": "vertex", "base_model": "imagen-3.0-fast-generate", "output_cost_per_image": 0.02}, "imagen-3.0-generate-001" : {"mode": "image_generation", "provider": "gemini", "base_model": "imagen-3.0-generate", "output_cost_per_image": 0.04}, "imagen-3.0-generate-002" : {"mode": "image_generation", "provider": "gemini", "base_model": "imagen-3.0-generate", "output_cost_per_image": 0.04}, "imagen-4.0-fast-generate-001" : {"mode": "image_generation", "provider": "gemini", "base_model": "imagen-4.0-fast-generate", "output_cost_per_image": 0.02}, "imagen-4.0-generate-001" : {"mode": "image_generation", "provider": "gemini", "base_model": "imagen-4.0-generate", "output_cost_per_image": 0.04}, "imagen-4.0-ultra-generate-001" : {"mode": "image_generation", "provider": "vertex", "base_model": "imagen-4.0-ultra-generate", "output_cost_per_image": 0.06}, "inception/mercury-2" : {"mode": "chat", "provider": "openrouter", "base_model": "mercury-2", "max_input_tokens": 128000, "max_output_tokens": 50000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000075, "cache_read_input_token_cost": 0.000000025}, "inception/mercury-coder-small" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "mercury-coder-small", "max_input_tokens": 32000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000001}, "inclusionai/ling-2.6-1t" : {"mode": "chat", "provider": "openrouter", "base_model": "ling-2.6-1t", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.000000625, "cache_read_input_token_cost": 0.000000015}, "inclusionai/ling-2.6-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "ling-2.6-flash", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.00000001, "output_cost_per_token": 0.00000003, "cache_read_input_token_cost": 0.000000002}, "inclusionai/ring-2.6-1t" : {"mode": "chat", "provider": "openrouter", "base_model": "ring-2.6-1t", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.000000625, "cache_read_input_token_cost": 0.000000015}, "inflection/inflection-3-pi" : {"mode": "chat", "provider": "openrouter", "base_model": "inflection-3-pi", "max_input_tokens": 8000, "max_output_tokens": 1024, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "inflection/inflection-3-productivity" : {"mode": "chat", "provider": "openrouter", "base_model": "inflection-3-productivity", "max_input_tokens": 8000, "max_output_tokens": 1024, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "inpaint" : {"mode": "image_edit", "provider": "stability", "base_model": "inpaint", "output_cost_per_image": 0.005}, "internlm2_5-20b-chat" : {"mode": "chat", "provider": "ollama", "base_model": "internlm2-5-20b-chat", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "intfloat/e5-base-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "e5-base-v2", "max_input_tokens": 512, "input_cost_per_token": 0.000000005}, "intfloat/e5-large-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "e5-large-v2", "max_input_tokens": 512, "input_cost_per_token": 0.00000001}, "intfloat/e5-mistral-7b-instruct" : {"mode": "embedding", "provider": "nebius", "base_model": "intfloat/e5-mistral-7b-instruct", "max_input_tokens": 32768, "input_cost_per_token": 0.00000001, "output_cost_per_token": 0}, "intfloat/multilingual-e5-large" : {"mode": "chat", "provider": "openrouter", "base_model": "multilingual-e5-large", "max_input_tokens": 512, "input_cost_per_token": 0.00000001}, "invoke/anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "j2-light" : {"mode": "completion", "provider": "ai21", "base_model": "j2-light", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003}, "j2-mid" : {"mode": "completion", "provider": "ai21", "base_model": "j2-mid", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00001}, "j2-ultra" : {"mode": "completion", "provider": "ai21", "base_model": "j2-ultra", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000015}, "jais-30b-chat" : {"mode": "chat", "provider": "azure", "base_model": "jais-30b-chat", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0032, "output_cost_per_token": 0.00971}, "jamba-1.5" : {"mode": "chat", "provider": "vertex", "base_model": "jamba-1.5", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004}, "jamba-1.5-large" : {"mode": "chat", "provider": "vertex", "base_model": "jamba-1.5-large", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "jamba-1.5-large@001" : {"mode": "chat", "provider": "vertex", "base_model": "jamba-1.5-large", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "jamba-1.5-mini" : {"mode": "chat", "provider": "snowflake", "base_model": "jamba-1.5-mini", "max_input_tokens": 256000, "max_output_tokens": 8192}, "jamba-1.5-mini@001" : {"mode": "chat", "provider": "ai21", "base_model": "jamba-1.5-mini", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004}, "jamba-instruct" : {"mode": "chat", "provider": "snowflake", "base_model": "jamba-instruct", "max_input_tokens": 256000, "max_output_tokens": 8192}, "jamba-large-1.6" : {"mode": "chat", "provider": "ai21", "base_model": "jamba-large-1.6", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "jamba-large-1.7" : {"mode": "chat", "provider": "ai21", "base_model": "jamba-large-1.7", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "jamba-mini-1.6" : {"mode": "chat", "provider": "ai21", "base_model": "jamba-mini-1.6", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004}, "jamba-mini-1.7" : {"mode": "chat", "provider": "ai21", "base_model": "jamba-mini-1.7", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004}, "jina-reranker-v2-base-multilingual" : {"mode": "rerank", "provider": "jina_ai", "base_model": "jina-reranker-v2-base-multilingual", "max_input_tokens": 1024, "max_output_tokens": 1024, "input_cost_per_token": 0.000000018, "output_cost_per_token": 0.000000018}, "jp.anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000055, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0.000001375}, "jp.anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125, "input_cost_per_token_above_200k_tokens": 0.0000066, "output_cost_per_token_above_200k_tokens": 0.00002475, "cache_read_input_token_cost_above_200k_tokens": 0.00000066, "cache_creation_input_token_cost_above_200k_tokens": 0.00000825}, "jp.anthropic.claude-sonnet-4-6" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "kimi-k2-0711-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000015}, "kimi-k2-0905-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000015}, "kimi-k2-thinking" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000015}, "kimi-k2-thinking-251104" : {"mode": "chat", "provider": "volcengine", "base_model": "kimi-k2-thinking", "max_input_tokens": 229376, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "kimi-k2-thinking-turbo" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2-thinking-turbo", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000115, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.00000015}, "kimi-k2-turbo-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2-turbo", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000115, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.00000015}, "kimi-k2.5" : {"mode": "chat", "provider": "azure", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003}, "kimi-k2.6" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2.6", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000095, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000016}, "kimi-k2p5" : {"mode": "chat", "provider": "fireworks", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.0000001}, "kimi-latest" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.00000015}, "kimi-latest-128k" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-latest-128k", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.00000015}, "kimi-latest-32k" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-latest-32k", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.00000015}, "kimi-latest-8k" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-latest-8k", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.00000015}, "kimi-thinking-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-thinking", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000015}, "kwaipilot/kat-coder-pro" : {"mode": "chat", "provider": "novita", "base_model": "kat-coder-pro", "max_input_tokens": 256000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000006}, "kwaipilot/kat-coder-pro-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "kat-coder-pro-v2", "max_input_tokens": 256000, "max_output_tokens": 80000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000006}, "kwaivgi/kling-v1.6-pro" : {"mode": "video_generation", "provider": "replicate", "base_model": "kwaivgi/kling-v1.6-pro", "output_cost_per_video_per_second": 0.096}, "kwaivgi/kling-v1.6-standard" : {"mode": "video_generation", "provider": "replicate", "base_model": "kwaivgi/kling-v1.6-standard", "output_cost_per_video_per_second": 0.05}, "kwaivgi/kling-v2.0" : {"mode": "video_generation", "provider": "replicate", "base_model": "kwaivgi/kling", "output_cost_per_video_per_second": 0.28}, "kwaivgi/kling-v2.1" : {"mode": "video_generation", "provider": "replicate", "base_model": "kwaivgi/kling", "output_cost_per_video_per_second": 0.05}, "kwaivgi/kling-v2.1-master" : {"mode": "video_generation", "provider": "replicate", "base_model": "kwaivgi/kling-v2.1-master", "output_cost_per_video_per_second": 0.28}, "labs-devstral-small-2512" : {"mode": "chat", "provider": "mistral", "base_model": "labs-devstral-small", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "learnlm-1.5-pro-experimental" : {"mode": "chat", "provider": "gemini", "base_model": "learnlm-1.5-pro", "max_input_tokens": 32767, "max_output_tokens": 8192, "input_cost_per_image": 0, "input_cost_per_token": 0, "output_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_video_per_second": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0}, "leonardoai/motion-2.0" : {"mode": "video_generation", "provider": "replicate", "base_model": "leonardoai/motion-2.0", "output_cost_per_video_per_second": 0.06}, "lfm-40b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "lfm-40b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002}, "lfm-7b" : {"mode": "chat", "provider": "lambda_ai", "base_model": "lfm-7b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000025, "output_cost_per_token": 0.00000004}, "liquid/lfm-2-24b-a2b" : {"mode": "chat", "provider": "openrouter", "base_model": "lfm-2-24b-a2b", "max_input_tokens": 32768, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000012}, "llama-2-70b-chat" : {"mode": "chat", "provider": "perplexity", "base_model": "llama-2-70b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000028}, "llama-3.1-70b-instruct" : {"mode": "chat", "provider": "perplexity", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "llama-3.1-8b" : {"mode": "chat", "provider": "llamagate", "base_model": "llama-3.1-8b", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000005}, "llama-3.1-8b-instant" : {"mode": "chat", "provider": "groq", "base_model": "llama-3.1-8b-instant", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008}, "llama-3.1-8b-instruct" : {"mode": "chat", "provider": "perplexity", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "llama-3.2-3b" : {"mode": "chat", "provider": "llamagate", "base_model": "llama-3.2-3b", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000008}, "llama-3.3-70b" : {"mode": "chat", "provider": "cerebras", "base_model": "llama-3.3-70b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000085, "output_cost_per_token": 0.0000012}, "llama-3.3-70b-versatile" : {"mode": "chat", "provider": "groq", "base_model": "llama-3.3-70b-versatile", "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079}, "llama-4-maverick-17b-128e-instruct-fp8" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-4-maverick-17b-128e-instruct-fp8", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000001}, "llama-4-scout-17b-16e-instruct" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-4-scout-17b-16e-instruct", "max_input_tokens": 16384, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000001}, "llama2" : {"mode": "chat", "provider": "ollama", "base_model": "llama-2", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama2-70b-chat" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-2-70b-chat", "max_input_tokens": 4096, "max_output_tokens": 8192}, "llama2-uncensored" : {"mode": "completion", "provider": "ollama", "base_model": "llama-2-uncensored", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama2:13b" : {"mode": "chat", "provider": "ollama", "base_model": "llama-2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama2:70b" : {"mode": "chat", "provider": "ollama", "base_model": "llama-2-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama2:7b" : {"mode": "chat", "provider": "ollama", "base_model": "llama-2-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama3" : {"mode": "chat", "provider": "ollama", "base_model": "llama-3", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama3-70b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3-70b", "max_input_tokens": 8000, "max_output_tokens": 8192}, "llama3-8b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3-8b", "max_input_tokens": 8000, "max_output_tokens": 8192}, "llama3-8b-instruct" : {"mode": "chat", "provider": "gradient_ai", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 512, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "llama3.1" : {"mode": "chat", "provider": "ollama", "base_model": "llama-3.1", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama3.1-405b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3.1-405b", "max_input_tokens": 128000, "max_output_tokens": 8192}, "llama3.1-405b-instruct-fp8" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.1-405b-instruct-fp8", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000008}, "llama3.1-70b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3.1-70b", "max_input_tokens": 128000, "max_output_tokens": 8192}, "llama3.1-70b-instruct-fp8" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.1-70b-instruct-fp8", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.0000003}, "llama3.1-8b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3.1-8b", "max_input_tokens": 128000, "max_output_tokens": 8192}, "llama3.1-8b-instruct" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000025, "output_cost_per_token": 0.00000004}, "llama3.1-nemotron-70b-instruct-fp8" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.1-nemotron-70b-instruct-fp8", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.0000003}, "llama3.2-11b-vision-instruct" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.2-11b-vision-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000015, "output_cost_per_token": 0.000000025}, "llama3.2-1b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3.2-1b", "max_input_tokens": 128000, "max_output_tokens": 8192}, "llama3.2-3b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3.2-3b", "max_input_tokens": 128000, "max_output_tokens": 8192}, "llama3.2-3b-instruct" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.2-3b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000015, "output_cost_per_token": 0.000000025}, "llama3.3-70b" : {"mode": "chat", "provider": "snowflake", "base_model": "llama-3.3-70b", "max_input_tokens": 128000, "max_output_tokens": 8192}, "llama3.3-70b-instruct" : {"mode": "chat", "provider": "gradient_ai", "base_model": "llama-3.3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000065}, "llama3.3-70b-instruct-fp8" : {"mode": "chat", "provider": "lambda_ai", "base_model": "llama-3.3-70b-instruct-fp8", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.0000003}, "llama3:70b" : {"mode": "chat", "provider": "ollama", "base_model": "llama-3-70b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llama3:8b" : {"mode": "chat", "provider": "ollama", "base_model": "llama-3-8b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "llava-7b" : {"mode": "chat", "provider": "llamagate", "base_model": "llava-7b", "max_input_tokens": 4096, "max_output_tokens": 2048, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002}, "llava-v1.6-mistral-7b-hf" : {"mode": "chat", "provider": "ovhcloud", "base_model": "llava-v1.6-mistral-7b", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000029, "output_cost_per_token": 0.00000029}, "long-form" : {"mode": "audio_speech", "provider": "aws_polly", "base_model": "long-form", "input_cost_per_character": 0.0001}, "low/1024-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000010490417, "output_cost_per_pixel": 0}, "low/1024-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.0000000020751953125, "output_cost_per_pixel": 0}, "low/1024-x-1536/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000010172526, "output_cost_per_pixel": 0}, "low/1024-x-1536/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.0000000020751953125, "output_cost_per_pixel": 0}, "low/1536-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000010172526, "output_cost_per_pixel": 0}, "low/1536-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.0000000020345052083, "output_cost_per_pixel": 0}, "luma/ray-2-540p" : {"mode": "video_generation", "provider": "replicate", "base_model": "luma/ray-2-540p", "output_cost_per_video_per_second": 0.1}, "luma/ray-2-720p" : {"mode": "video_generation", "provider": "replicate", "base_model": "luma/ray-2-720p", "output_cost_per_video_per_second": 0.18}, "luma/ray-flash-2-540p" : {"mode": "video_generation", "provider": "replicate", "base_model": "luma/ray-flash-2-540p", "output_cost_per_video_per_second": 0.034}, "luma/ray-flash-2-720p" : {"mode": "video_generation", "provider": "replicate", "base_model": "luma/ray-flash-2-720p", "output_cost_per_video_per_second": 0.06}, "lyria-3-clip-preview" : {"mode": "chat", "provider": "gemini", "base_model": "lyria-3-clip", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_image": 0.04, "output_cost_per_token": 0}, "lyria-3-pro-preview" : {"mode": "chat", "provider": "gemini", "base_model": "lyria-3-pro", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "magistral-medium-1-2-2509" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-medium-1-2", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "magistral-medium-2506" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-medium", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "magistral-medium-2509" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-medium", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "magistral-medium-latest" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-medium", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "magistral-small-1-2-2509" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-small-1-2", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "magistral-small-2506" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-small", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "magistral-small-latest" : {"mode": "chat", "provider": "mistral", "base_model": "magistral-small", "max_input_tokens": 40000, "max_output_tokens": 40000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mamba-codestral-7B-v0.1" : {"mode": "chat", "provider": "ovhcloud", "base_model": "mamba-codestral-7b", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.00000019, "output_cost_per_token": 0.00000019}, "mancer/weaver" : {"mode": "chat", "provider": "openrouter", "base_model": "weaver", "max_input_tokens": 8000, "max_output_tokens": 2000, "input_cost_per_token": 0.000005625, "output_cost_per_token": 0.000005625}, "max-steps/stability.stable-diffusion-xl-v0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-diffusion-xl-v0", "max_input_tokens": 77, "output_cost_per_image": 0.036}, "max-steps/stability.stable-diffusion-xl-v1" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-diffusion-xl-v1", "max_input_tokens": 77, "output_cost_per_image": 0.08}, "medium/1024-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000040054321, "output_cost_per_pixel": 0}, "medium/1024-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.000000008056640625, "output_cost_per_pixel": 0}, "medium/1024-x-1536/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000040054321, "output_cost_per_pixel": 0}, "medium/1024-x-1536/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.000000008056640625, "output_cost_per_pixel": 0}, "medium/1536-x-1024/gpt-image-1" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1", "input_cost_per_pixel": 0.000000040054321, "output_cost_per_pixel": 0}, "medium/1536-x-1024/gpt-image-1-mini" : {"mode": "image_generation", "provider": "azure", "base_model": "gpt-image-1-mini", "input_cost_per_pixel": 0.0000000079752604167, "output_cost_per_pixel": 0}, "medlm-large" : {"mode": "chat", "provider": "vertex", "base_model": "medlm-large", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_character": 0.000005}, "medlm-medium" : {"mode": "chat", "provider": "vertex", "base_model": "medlm-medium", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_character": 0.0000005}, "meta-llama-3.1-70b-instruct" : {"mode": "chat", "provider": "friendliai", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "meta-llama-3.1-8b-instruct" : {"mode": "chat", "provider": "friendliai", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "meta-llama/Llama-2-13b-chat-hf" : {"mode": "chat", "provider": "anyscale", "base_model": "llama-2-13b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025}, "meta-llama/Llama-2-70b-chat-hf" : {"mode": "chat", "provider": "anyscale", "base_model": "llama-2-70b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "meta-llama/Llama-2-7b-chat-hf" : {"mode": "chat", "provider": "anyscale", "base_model": "llama-2-7b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "meta-llama/Llama-3.1-8B-Instruct" : {"mode": "chat", "provider": "wandb", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.022, "output_cost_per_token": 0.022}, "meta-llama/Llama-3.2-11B-Vision-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-3.2-11b-vision-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000049, "output_cost_per_token": 0.000000049}, "meta-llama/Llama-3.2-3B-Instruct" : {"mode": "chat", "provider": "hyperbolic", "base_model": "llama-3.2-3b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.0000003}, "meta-llama/Llama-3.2-3B-Instruct-Turbo" : {"mode": "chat", "provider": "together_ai", "base_model": "llama-3.2-3b-instruct-turbo"}, "meta-llama/Llama-3.3-70B-Instruct" : {"mode": "chat", "provider": "nscale", "base_model": "llama-3.3-70b-instruct", "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "meta-llama/Llama-3.3-70B-Instruct-Turbo" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-3.3-70b-instruct-turbo", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000039}, "meta-llama/Llama-3.3-70B-Instruct-Turbo-Free" : {"mode": "chat", "provider": "together_ai", "base_model": "llama-3.3-70b-instruct-turbo-free", "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8" : {"mode": "chat", "provider": "together_ai", "base_model": "llama-4-maverick-17b-128e-instruct-fp8", "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000085}, "meta-llama/Llama-4-Scout-17B-16E-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-4-scout-17b-16e-instruct", "max_input_tokens": 327680, "max_output_tokens": 327680, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.0000003}, "meta-llama/Llama-Guard-3-8B" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-guard-3-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000055, "output_cost_per_token": 0.000000055}, "meta-llama/Llama-Guard-4-12B" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-guard-4-12b", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018}, "meta-llama/Meta-Llama-3-70B-Instruct" : {"mode": "chat", "provider": "anyscale", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "meta-llama/Meta-Llama-3-8B-Instruct" : {"mode": "chat", "provider": "anyscale", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "meta-llama/Meta-Llama-3.1-405B-Instruct" : {"mode": "chat", "provider": "nebius", "base_model": "llama-3.1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo" : {"mode": "chat", "provider": "together_ai", "base_model": "llama-3.1-405b-instruct-turbo", "input_cost_per_token": 0.0000035, "output_cost_per_token": 0.0000035}, "meta-llama/Meta-Llama-3.1-70B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000004}, "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo" : {"mode": "chat", "provider": "together_ai", "base_model": "llama-3.1-70b-instruct-turbo", "input_cost_per_token": 0.00000088, "output_cost_per_token": 0.00000088}, "meta-llama/Meta-Llama-3.1-8B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000005}, "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo" : {"mode": "chat", "provider": "together_ai", "base_model": "llama-3.1-8b-instruct-turbo", "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018}, "meta-llama/llama-3-2-11b-vision-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-3-2-11b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035}, "meta-llama/llama-3-2-1b-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-3-2-1b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "meta-llama/llama-3-2-3b-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-3-2-3b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "meta-llama/llama-3-2-90b-vision-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-3-2-90b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "meta-llama/llama-3-3-70b-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-3-3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000071, "output_cost_per_token": 0.00000071}, "meta-llama/llama-3-70b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8000, "input_cost_per_token": 0.00000051, "output_cost_per_token": 0.00000074}, "meta-llama/llama-3-8b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004}, "meta-llama/llama-3.1-70b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000004}, "meta-llama/llama-3.1-8b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0.00000005}, "meta-llama/llama-3.2-11b-vision-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-3.2-11b-vision-instruct", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.000000245, "output_cost_per_token": 0.000000245}, "meta-llama/llama-3.2-1b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-3.2-1b-instruct", "max_input_tokens": 60000, "max_output_tokens": 60000, "input_cost_per_token": 0.000000027, "output_cost_per_token": 0.000000201}, "meta-llama/llama-3.2-3b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "llama-3.2-3b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32000, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000005}, "meta-llama/llama-3.3-70b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "llama-3.3-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 120000, "input_cost_per_token": 0.000000135, "output_cost_per_token": 0.0000004}, "meta-llama/llama-4-maverick" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-4-maverick", "max_input_tokens": 1048576, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "meta-llama/llama-4-maverick-17b" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-4-maverick-17b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.0000014}, "meta-llama/llama-4-maverick-17b-128e-instruct" : {"mode": "chat", "provider": "groq", "base_model": "llama-4-maverick-17b-128e-instruct", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "meta-llama/llama-4-maverick-17b-128e-instruct-fp8" : {"mode": "chat", "provider": "novita", "base_model": "llama-4-maverick-17b-128e-instruct-fp8", "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000085}, "meta-llama/llama-4-scout" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-4-scout", "max_input_tokens": 327680, "max_output_tokens": 16384, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.0000003}, "meta-llama/llama-4-scout-17b-16e-instruct" : {"mode": "chat", "provider": "novita", "base_model": "llama-4-scout-17b-16e-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000059}, "meta-llama/llama-guard-3-11b-vision" : {"mode": "chat", "provider": "watsonx", "base_model": "llama-guard-3-11b-vision", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035}, "meta-llama/llama-guard-3-8b" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-guard-3-8b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000000484, "output_cost_per_token": 0.00000003}, "meta-llama/llama-guard-4-12b" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-guard-4-12b", "max_input_tokens": 163840, "max_output_tokens": 16384, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018}, "meta-textgeneration-llama-2-13b" : {"mode": "completion", "provider": "sagemaker", "base_model": "llama-2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta-textgeneration-llama-2-13b-f" : {"mode": "chat", "provider": "sagemaker", "base_model": "llama-2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta-textgeneration-llama-2-70b" : {"mode": "completion", "provider": "sagemaker", "base_model": "llama-2-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta-textgeneration-llama-2-70b-b-f" : {"mode": "chat", "provider": "sagemaker", "base_model": "llama-2-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta-textgeneration-llama-2-7b" : {"mode": "completion", "provider": "sagemaker", "base_model": "llama-2-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta-textgeneration-llama-2-7b-f" : {"mode": "chat", "provider": "sagemaker", "base_model": "llama-2-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta.llama-3.1-405b-instruct" : {"mode": "chat", "provider": "oci", "base_model": "llama-3.1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00001068, "output_cost_per_token": 0.00001068}, "meta.llama-3.1-70b-instruct" : {"mode": "chat", "provider": "oci", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta.llama-3.2-11b-vision-instruct" : {"mode": "chat", "provider": "oci", "base_model": "llama-3.2-11b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "meta.llama-3.2-90b-vision-instruct" : {"mode": "chat", "provider": "oci", "base_model": "llama-3.2-90b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "meta.llama-3.3-70b-instruct" : {"mode": "chat", "provider": "oci", "base_model": "llama-3.3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta.llama-3.3-70b-instruct-fp8-dynamic" : {"mode": "chat", "provider": "oci", "base_model": "llama-3.3-70b-instruct-fp8-dynamic", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta.llama-4-maverick-17b-128e-instruct-fp8" : {"mode": "chat", "provider": "oci", "base_model": "llama-4-maverick-17b-128e-instruct-fp8", "max_input_tokens": 512000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta.llama-4-scout-17b-16e-instruct" : {"mode": "chat", "provider": "oci", "base_model": "llama-4-scout-17b-16e-instruct", "max_input_tokens": 192000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta.llama2-13b-chat-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-2-13b-chat-v1", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.000001}, "meta.llama2-70b-chat-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-2-70b-chat-v1", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000195, "output_cost_per_token": 0.00000256}, "meta.llama3-1-405b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000532, "output_cost_per_token": 0.000016}, "meta.llama3-1-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-1-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000099, "output_cost_per_token": 0.00000099}, "meta.llama3-1-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-1-8b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000022}, "meta.llama3-2-11b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-11b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035}, "meta.llama3-2-1b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-1b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "meta.llama3-2-3b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-3b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "meta.llama3-2-90b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-90b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "meta.llama3-3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035}, "meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006}, "meta.llama4-maverick-17b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-4-maverick-17b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000024, "output_cost_per_token": 0.00000097, "input_cost_per_token_batches": 0.00000012, "output_cost_per_token_batches": 0.000000485}, "meta.llama4-scout-17b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-4-scout-17b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000066, "input_cost_per_token_batches": 0.000000085, "output_cost_per_token_batches": 0.00000033}, "meta/llama-2-13b" : {"mode": "chat", "provider": "replicate", "base_model": "llama-2-13b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000005}, "meta/llama-2-13b-chat" : {"mode": "chat", "provider": "replicate", "base_model": "llama-2-13b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000005}, "meta/llama-2-70b" : {"mode": "chat", "provider": "replicate", "base_model": "llama-2-70b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275}, "meta/llama-2-70b-chat" : {"mode": "chat", "provider": "replicate", "base_model": "llama-2-70b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275}, "meta/llama-2-7b" : {"mode": "chat", "provider": "replicate", "base_model": "llama-2-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025}, "meta/llama-2-7b-chat" : {"mode": "chat", "provider": "replicate", "base_model": "llama-2-7b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025}, "meta/llama-3-70b" : {"mode": "chat", "provider": "replicate", "base_model": "llama-3-70b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275}, "meta/llama-3-70b-instruct" : {"mode": "chat", "provider": "replicate", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275}, "meta/llama-3-8b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3-8b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008}, "meta/llama-3-8b-instruct" : {"mode": "chat", "provider": "replicate", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8086, "max_output_tokens": 8086, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025}, "meta/llama-3.1-405b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3.1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000016}, "meta/llama-3.1-70b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.1-70b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta/llama-3.1-70b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3.1-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta/llama-3.1-8b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.1-8b", "max_input_tokens": 131000, "max_output_tokens": 131072, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008}, "meta/llama-3.1-8b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3.1-8b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta/llama-3.2-11b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.2-11b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000016, "output_cost_per_token": 0.00000016}, "meta/llama-3.2-1b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.2-1b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "meta/llama-3.2-3b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.2-3b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "meta/llama-3.2-90b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.2-90b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta/llama-3.2-90b-vision-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3.2-90b-vision-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta/llama-3.3-70b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-3.3-70b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "meta/llama-4-maverick" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-4-maverick", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "meta/llama-4-maverick-17b-128e-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-4-maverick-17b-128e-instruct", "max_input_tokens": 1000000, "max_output_tokens": 1000000, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000115}, "meta/llama-4-maverick-17b-16e-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-4-maverick-17b-16e-instruct", "max_input_tokens": 1000000, "max_output_tokens": 1000000, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000115}, "meta/llama-4-scout" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "llama-4-scout", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "meta/llama-4-scout-17b-128e-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-4-scout-17b-128e-instruct", "max_input_tokens": 10000000, "max_output_tokens": 10000000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.0000007}, "meta/llama-4-scout-17b-16e-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-4-scout-17b-16e-instruct", "max_input_tokens": 10000000, "max_output_tokens": 10000000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.0000007}, "meta/llama3-405b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3-405b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta/llama3-70b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3-70b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "meta/llama3-8b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "llama-3-8b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "microsoft/Phi-4-mini-instruct" : {"mode": "chat", "provider": "wandb", "base_model": "phi-4-mini-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.008, "output_cost_per_token": 0.035}, "microsoft/WizardLM-2-8x22B" : {"mode": "chat", "provider": "deepinfra", "base_model": "wizardlm-2-8x22b", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.00000048, "output_cost_per_token": 0.00000048}, "microsoft/mai-image-2.5" : {"mode": "image_generation", "provider": "openrouter", "base_model": "mai-image-2.5", "max_input_tokens": 4096, "max_output_tokens": 1024, "input_cost_per_token": 0.000005}, "microsoft/mai-transcribe-1.5" : {"mode": "chat", "provider": "openrouter", "base_model": "mai-transcribe-1.5", "max_input_tokens": 0, "input_cost_per_token": 0.36}, "microsoft/mai-voice-2" : {"mode": "chat", "provider": "openrouter", "base_model": "mai-voice-2", "max_input_tokens": 0, "input_cost_per_token": 0.000022}, "microsoft/phi-4" : {"mode": "chat", "provider": "deepinfra", "base_model": "phi-4", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000014}, "microsoft/phi-4-mini-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "phi-4-mini-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000035, "cache_read_input_token_cost": 0.00000008}, "microsoft/wizardlm-2-8x22b" : {"mode": "chat", "provider": "novita", "base_model": "wizardlm-2-8x22b", "max_input_tokens": 65535, "max_output_tokens": 8000, "input_cost_per_token": 0.00000062, "output_cost_per_token": 0.00000062}, "minimax-m2p1" : {"mode": "chat", "provider": "fireworks", "base_model": "minimax-m2.1", "max_input_tokens": 204800, "max_output_tokens": 204800, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000003}, "minimax.minimax-m2" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "minimax/hailuo-02" : {"mode": "video_generation", "provider": "replicate", "base_model": "hailuo-02", "output_cost_per_video_per_second": 0.017}, "minimax/hailuo-02-fast" : {"mode": "video_generation", "provider": "replicate", "base_model": "hailuo-02-fast", "output_cost_per_video_per_second": 0.015}, "minimax/minimax-01" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-01", "max_input_tokens": 1000192, "max_output_tokens": 1000192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000011}, "minimax/minimax-m1" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m1", "max_input_tokens": 1000000, "max_output_tokens": 40000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000022}, "minimax/minimax-m2" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m2", "max_input_tokens": 204800, "max_output_tokens": 204800, "input_cost_per_token": 0.000000255, "output_cost_per_token": 0.00000102, "cache_read_input_token_cost": 0.00000003}, "minimax/minimax-m2-her" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m2-her", "max_input_tokens": 65536, "max_output_tokens": 2048, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000003}, "minimax/minimax-m2.1" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m2.1", "max_input_tokens": 204000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0, "cache_creation_input_token_cost": 0}, "minimax/minimax-m2.5" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m2.5", "max_input_tokens": 196608, "max_output_tokens": 65536, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000011, "cache_read_input_token_cost": 0.00000015}, "minimax/minimax-m2.7" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m2.7", "max_input_tokens": 196608, "max_output_tokens": 196608, "input_cost_per_token": 0.000000279, "output_cost_per_token": 0.0000012}, "minimax/minimax-m3" : {"mode": "chat", "provider": "openrouter", "base_model": "minimax-m3", "max_input_tokens": 524288, "max_output_tokens": 512000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "cache_read_input_token_cost": 0.00000006}, "minimax/video-01" : {"mode": "video_generation", "provider": "replicate", "base_model": "video-01", "output_cost_per_video_per_second": 0.1}, "minimax/video-01-director" : {"mode": "video_generation", "provider": "replicate", "base_model": "video-01-director", "output_cost_per_video_per_second": 0.1}, "minimax/video-01-live" : {"mode": "video_generation", "provider": "replicate", "base_model": "video-01-live", "output_cost_per_video_per_second": 0.1}, "minimaxai/minimax-m1-80k" : {"mode": "chat", "provider": "novita", "base_model": "minimax-m1-80k", "max_input_tokens": 1000000, "max_output_tokens": 40000, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.0000022}, "minimaxai/minimax-m2-maas" : {"mode": "chat", "provider": "vertex", "base_model": "minimax-m2", "max_input_tokens": 196608, "max_output_tokens": 196608, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "ministral-3-14b-2512" : {"mode": "chat", "provider": "mistral", "base_model": "ministral-3-14b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "ministral-3-3b-2512" : {"mode": "chat", "provider": "mistral", "base_model": "ministral-3-3b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "ministral-3-8b-2512" : {"mode": "chat", "provider": "mistral", "base_model": "ministral-3-8b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "ministral-3b" : {"mode": "chat", "provider": "azure", "base_model": "ministral-3b", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004}, "ministral-8b-2512" : {"mode": "chat", "provider": "mistral", "base_model": "ministral-8b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "mistral" : {"mode": "completion", "provider": "ollama", "base_model": "mistral", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "mistral-7B-Instruct-v0.1" : {"mode": "chat", "provider": "ollama", "base_model": "mistral-7b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "mistral-7B-Instruct-v0.2" : {"mode": "chat", "provider": "ollama", "base_model": "mistral-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "mistral-7b" : {"mode": "chat", "provider": "snowflake", "base_model": "mistral-7b", "max_input_tokens": 32000, "max_output_tokens": 8192}, "mistral-7b-instruct" : {"mode": "chat", "provider": "perplexity", "base_model": "mistral-7b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "mistral-7b-v0.3" : {"mode": "chat", "provider": "llamagate", "base_model": "mistral-7b", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.00000015}, "mistral-document-ai-2505" : {"mode": "ocr", "provider": "azure", "base_model": "mistral-document-ai", "ocr_cost_per_page": 0.003}, "mistral-document-ai-2512" : {"mode": "ocr", "provider": "azure", "base_model": "mistral-document-ai", "ocr_cost_per_page": 0.003}, "mistral-embed" : {"mode": "embedding", "provider": "mistral", "base_model": "mistral-embed", "max_input_tokens": 8192, "input_cost_per_token": 0.0000001}, "mistral-large" : {"mode": "chat", "provider": "azure", "base_model": "mistral-large", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000012}, "mistral-large-2402" : {"mode": "chat", "provider": "azure", "base_model": "mistral-large", "max_input_tokens": 32000, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "mistral-large-2407" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000009}, "mistral-large-2411" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "mistral-large-2512" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-large", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mistral-large-3" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-large-3", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mistral-large-instruct-2407" : {"mode": "chat", "provider": "ollama", "base_model": "mistral-large-instruct", "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0}, "mistral-large-latest" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-large", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mistral-large2" : {"mode": "chat", "provider": "snowflake", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 8192}, "mistral-large@2407" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "mistral-large@2411-001" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "mistral-large@latest" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "mistral-medium" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-medium", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000027, "output_cost_per_token": 0.0000081}, "mistral-medium-2312" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-medium", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000027, "output_cost_per_token": 0.0000081}, "mistral-medium-2505" : {"mode": "chat", "provider": "azure", "base_model": "mistral-medium", "max_input_tokens": 131072, "max_output_tokens": 8191, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistral-medium-3" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-medium-3", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistral-medium-3-1-2508" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-medium-3-1", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistral-medium-3@001" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-medium-3", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistral-medium-latest" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-medium", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistral-nemo" : {"mode": "chat", "provider": "azure", "base_model": "mistral-nemo", "max_input_tokens": 131072, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "mistral-nemo-instruct-2407" : {"mode": "chat", "provider": "gradient_ai", "base_model": "mistral-nemo-instruct", "max_input_tokens": 128000, "max_output_tokens": 512, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003}, "mistral-nemo@2407" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-nemo", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003}, "mistral-nemo@latest" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-nemo", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "mistral-ocr-2505" : {"mode": "ocr", "provider": "vertex", "base_model": "mistral-ocr", "ocr_cost_per_page": 0.0005}, "mistral-ocr-2505-completion" : {"mode": "ocr", "provider": "mistral", "base_model": "mistral-ocr-2505-completion", "ocr_cost_per_page": 0.001, "annotation_cost_per_page": 0.003}, "mistral-ocr-latest" : {"mode": "ocr", "provider": "mistral", "base_model": "mistral-ocr", "ocr_cost_per_page": 0.001, "annotation_cost_per_page": 0.003}, "mistral-small" : {"mode": "chat", "provider": "azure", "base_model": "mistral-small", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "mistral-small-2503" : {"mode": "chat", "provider": "azure", "base_model": "mistral-small", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistral-small-2503@001" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-small", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "mistral-small-3-2-2506" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-small-3-2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000018}, "mistral-small-latest" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-small", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000018}, "mistral-tiny" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-tiny", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025}, "mistral.devstral-2-123b" : {"mode": "chat", "provider": "bedrock", "base_model": "devstral-2-123b", "max_input_tokens": 256000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistral.magistral-small-2509" : {"mode": "chat", "provider": "bedrock", "base_model": "magistral-small", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mistral.ministral-3-14b-instruct" : {"mode": "chat", "provider": "bedrock", "base_model": "ministral-3-14b-instruct", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "mistral.ministral-3-3b-instruct" : {"mode": "chat", "provider": "bedrock", "base_model": "ministral-3-3b-instruct", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "mistral.ministral-3-8b-instruct" : {"mode": "chat", "provider": "bedrock", "base_model": "ministral-3-8b-instruct", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "mistral.mistral-7b-instruct-v0:2" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000002}, "mistral.mistral-large-2402-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-large", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "mistral.mistral-large-2407-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-large", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000009}, "mistral.mistral-large-3-675b-instruct" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-large-3-675b-instruct", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mistral.mistral-small-2402-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-small", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "mistral.mixtral-8x7b-instruct-v0:1" : {"mode": "chat", "provider": "bedrock", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000007}, "mistral.voxtral-mini-3b-2507" : {"mode": "chat", "provider": "bedrock", "base_model": "voxtral-mini-3b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004}, "mistral.voxtral-small-24b-2507" : {"mode": "chat", "provider": "bedrock", "base_model": "voxtral-small-24b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistral/codestral" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "codestral", "max_input_tokens": 256000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009}, "mistral/codestral-embed" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "codestral-embed", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0}, "mistral/devstral-small" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "devstral-small", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "mistral/magistral-medium" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "magistral-medium", "max_input_tokens": 128000, "max_output_tokens": 64000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "mistral/magistral-small" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "magistral-small", "max_input_tokens": 128000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "mistral/ministral-3b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "ministral-3b", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004}, "mistral/ministral-8b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "ministral-8b", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "mistral/mistral-embed" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "mistral-embed", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "mistral/mistral-large" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "mistral-large", "max_input_tokens": 32000, "max_output_tokens": 4000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "mistral/mistral-saba-24b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "mistral-saba-24b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000079, "output_cost_per_token": 0.00000079}, "mistral/mistral-small" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "mistral-small", "max_input_tokens": 32000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistral/mixtral-8x22b-instruct" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "mixtral-8x22b-instruct", "max_input_tokens": 65536, "max_output_tokens": 2048, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012}, "mistral/pixtral-12b" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "pixtral-12b", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "mistral/pixtral-large" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "pixtral-large", "max_input_tokens": 128000, "max_output_tokens": 4000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "mistralai/Mistral-7B-Instruct-v0.1" : {"mode": "chat", "provider": "together_ai", "base_model": "mistral-7b-instruct"}, "mistralai/Mistral-Nemo-Instruct-2407" : {"mode": "chat", "provider": "nebius", "base_model": "mistral-nemo-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000012}, "mistralai/Mistral-Small-24B-Instruct-2501" : {"mode": "chat", "provider": "deepinfra", "base_model": "mistral-small-24b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008}, "mistralai/Mistral-Small-3.2-24B-Instruct-2506" : {"mode": "chat", "provider": "deepinfra", "base_model": "mistral-small-3.2-24b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000002}, "mistralai/Mixtral-8x22B-Instruct-v0.1" : {"mode": "chat", "provider": "anyscale", "base_model": "mixtral-8x22b-instruct", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "mistralai/Mixtral-8x7B-Instruct-v0.1" : {"mode": "chat", "provider": "together_ai", "base_model": "mixtral-8x7b-instruct", "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "mistralai/codestral-2" : {"mode": "chat", "provider": "vertex", "base_model": "codestral-2", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009}, "mistralai/codestral-2508" : {"mode": "chat", "provider": "openrouter", "base_model": "codestral-2508", "max_input_tokens": 256000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009, "cache_read_input_token_cost": 0.00000003}, "mistralai/codestral-2@001" : {"mode": "chat", "provider": "vertex", "base_model": "codestral-2", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009}, "mistralai/codestral-embed-2505" : {"mode": "chat", "provider": "openrouter", "base_model": "codestral-embed-2505", "max_input_tokens": 8192, "input_cost_per_token": 0.00000015}, "mistralai/devstral-2512" : {"mode": "chat", "provider": "openrouter", "base_model": "devstral", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_image": 0, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.00000004}, "mistralai/ministral-14b-2512" : {"mode": "chat", "provider": "openrouter", "base_model": "ministral-14b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_image": 0, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "cache_read_input_token_cost": 0.00000002}, "mistralai/ministral-3b-2512" : {"mode": "chat", "provider": "openrouter", "base_model": "ministral-3b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_image": 0, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "cache_read_input_token_cost": 0.00000001}, "mistralai/ministral-8b-2512" : {"mode": "chat", "provider": "openrouter", "base_model": "ministral-8b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_image": 0, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "cache_read_input_token_cost": 0.000000015}, "mistralai/mistral-7b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 8191, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013}, "mistralai/mistral-7b-instruct-v0.2" : {"mode": "chat", "provider": "replicate", "base_model": "mistral-7b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025}, "mistralai/mistral-7b-v0.1" : {"mode": "chat", "provider": "replicate", "base_model": "mistral-7b", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025}, "mistralai/mistral-embed-2312" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-embed-2312", "max_input_tokens": 8192, "input_cost_per_token": 0.0000001}, "mistralai/mistral-large" : {"mode": "chat", "provider": "watsonx", "base_model": "mistral-large", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.00001}, "mistralai/mistral-large-2407" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-large-2407", "max_input_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "mistralai/mistral-large-2512" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-large", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_image": 0, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0.00000005}, "mistralai/mistral-medium-2505" : {"mode": "chat", "provider": "watsonx", "base_model": "mistral-medium", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.00001}, "mistralai/mistral-medium-3" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-medium-3", "max_input_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.00000004}, "mistralai/mistral-medium-3-5" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-medium-3-5", "max_input_tokens": 262144, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.0000075}, "mistralai/mistral-medium-3.1" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-medium-3.1", "max_input_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.00000004}, "mistralai/mistral-medium-3@001" : {"mode": "chat", "provider": "vertex", "base_model": "mistral-medium-3", "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "mistralai/mistral-nemo" : {"mode": "chat", "provider": "novita", "base_model": "mistral-nemo", "max_input_tokens": 60288, "max_output_tokens": 16000, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000017}, "mistralai/mistral-saba" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-saba", "max_input_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.00000002}, "mistralai/mistral-small-24b-instruct-2501" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-small-24b-instruct-2501", "max_input_tokens": 32768, "max_output_tokens": 16384, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008}, "mistralai/mistral-small-2503" : {"mode": "chat", "provider": "watsonx", "base_model": "mistral-small", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistralai/mistral-small-2603" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-small-2603", "max_input_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000015}, "mistralai/mistral-small-3-1-24b-instruct-2503" : {"mode": "chat", "provider": "watsonx", "base_model": "mistral-small-3-1-24b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistralai/mistral-small-3.1-24b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-small-3.1-24b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistralai/mistral-small-3.2-24b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "mistral-small-3.2-24b-instruct", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003}, "mistralai/mixtral-8x22b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "mixtral-8x22b-instruct", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000065, "cache_read_input_token_cost": 0.0000002}, "mistralai/mixtral-8x22b-instruct-v0.1" : {"mode": "chat", "provider": "nscale", "base_model": "mixtral-8x22b-instruct", "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "mistralai/mixtral-8x7b-instruct-v0.1" : {"mode": "chat", "provider": "replicate", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.000001}, "mistralai/pixtral-12b-2409" : {"mode": "chat", "provider": "watsonx", "base_model": "pixtral-12b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035}, "mistralai/voxtral-mini-transcribe" : {"mode": "chat", "provider": "openrouter", "base_model": "voxtral-mini-transcribe", "max_input_tokens": 0, "input_cost_per_token": 0.003}, "mistralai/voxtral-mini-tts-2603" : {"mode": "chat", "provider": "openrouter", "base_model": "voxtral-mini-tts-2603", "max_input_tokens": 4096, "input_cost_per_token": 0.000016}, "mistralai/voxtral-small-24b-2507" : {"mode": "chat", "provider": "openrouter", "base_model": "voxtral-small-24b-2507", "max_input_tokens": 32000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003, "cache_read_input_token_cost": 0.00000001}, "mixtral-8x22B-Instruct-v0.1" : {"mode": "chat", "provider": "ollama", "base_model": "mixtral-8x22b-instruct", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0, "output_cost_per_token": 0}, "mixtral-8x7B-Instruct-v0.1" : {"mode": "chat", "provider": "ollama", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0, "output_cost_per_token": 0}, "mixtral-8x7b" : {"mode": "chat", "provider": "snowflake", "base_model": "mixtral-8x7b", "max_input_tokens": 32000, "max_output_tokens": 8192}, "mixtral-8x7b-instruct" : {"mode": "chat", "provider": "perplexity", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "model_router" : {"mode": "chat", "provider": "azure", "base_model": "model-router", "input_cost_per_token": 0.00000014, "output_cost_per_token": 0}, "moonshot-v1-128k" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-128k", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "moonshot-v1-128k-0430" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-128k", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "moonshot-v1-128k-vision-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-128k-vision", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "moonshot-v1-32k" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-32k", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "moonshot-v1-32k-0430" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-32k", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "moonshot-v1-32k-vision-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-32k-vision", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "moonshot-v1-8k" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-8k", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.000002}, "moonshot-v1-8k-0430" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-8k", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.000002}, "moonshot-v1-8k-vision-preview" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-8k-vision", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.000002}, "moonshot-v1-auto" : {"mode": "chat", "provider": "moonshot", "base_model": "moonshot-v1-auto", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000005}, "moonshot.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000073, "output_cost_per_token": 0.00000303}, "moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000303}, "moonshotai.kimi-k2.6" : {"mode": "chat", "provider": "moonshot", "base_model": "kimi-k2.6", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003}, "moonshotai/Kimi-K2-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "kimi-k2-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.000002}, "moonshotai/Kimi-K2-Instruct-0905" : {"mode": "chat", "provider": "baseten", "base_model": "kimi-k2-instruct", "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "moonshotai/Kimi-K2-Thinking" : {"mode": "chat", "provider": "baseten", "base_model": "kimi-k2-thinking", "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "moonshotai/Kimi-K2.5" : {"mode": "chat", "provider": "together_ai", "base_model": "kimi-k2.5", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000028}, "moonshotai/kimi-k2" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "kimi-k2", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.0000022}, "moonshotai/kimi-k2-0905" : {"mode": "chat", "provider": "openrouter", "base_model": "kimi-k2-0905", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "moonshotai/kimi-k2-instruct" : {"mode": "chat", "provider": "novita", "base_model": "kimi-k2-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000057, "output_cost_per_token": 0.0000023}, "moonshotai/kimi-k2-instruct-0905" : {"mode": "chat", "provider": "groq", "base_model": "kimi-k2-instruct", "max_input_tokens": 262144, "max_output_tokens": 16384, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.0000005}, "moonshotai/kimi-k2-thinking" : {"mode": "chat", "provider": "novita", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "moonshotai/kimi-k2-thinking-maas" : {"mode": "chat", "provider": "vertex", "base_model": "kimi-k2-thinking", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "moonshotai/kimi-k2.5" : {"mode": "chat", "provider": "openrouter", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.0000001}, "moonshotai/kimi-k2.6" : {"mode": "chat", "provider": "openrouter", "base_model": "kimi-k2.6", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.0000001}, "morph-v3-fast" : {"mode": "chat", "provider": "morph", "base_model": "morph-v3-fast", "max_input_tokens": 16000, "max_output_tokens": 16000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000012}, "morph-v3-large" : {"mode": "chat", "provider": "morph", "base_model": "morph-v3-large", "max_input_tokens": 16000, "max_output_tokens": 16000, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000019}, "morph/morph-v3-fast" : {"mode": "chat", "provider": "openrouter", "base_model": "morph-v3-fast", "max_input_tokens": 81920, "max_output_tokens": 38000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000012}, "morph/morph-v3-large" : {"mode": "chat", "provider": "openrouter", "base_model": "morph-v3-large", "max_input_tokens": 262144, "max_output_tokens": 131072, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000019}, "multimodalembedding" : {"mode": "embedding", "provider": "vertex", "base_model": "multimodalembedding", "max_input_tokens": 2048, "input_cost_per_image": 0.0001, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0, "input_cost_per_character": 0.0000002, "input_cost_per_video_per_second": 0.0005}, "multimodalembedding@001" : {"mode": "embedding", "provider": "vertex", "base_model": "multimodalembedding", "max_input_tokens": 2048, "input_cost_per_image": 0.0001, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0, "input_cost_per_character": 0.0000002, "input_cost_per_video_per_second": 0.0005}, "nano" : {"mode": "audio_transcription", "provider": "assemblyai", "base_model": "nano", "input_cost_per_second": 0.00010278, "output_cost_per_second": 0}, "neural" : {"mode": "audio_speech", "provider": "aws_polly", "base_model": "neural", "input_cost_per_character": 0.000016}, "nex-agi/deepseek-v3.1-nex-n1" : {"mode": "chat", "provider": "openrouter", "base_model": "deepseek-v3.1-nex-n1", "max_input_tokens": 131072, "max_output_tokens": 163840, "input_cost_per_token": 0.000000135, "output_cost_per_token": 0.0000005}, "nomic-ai/nomic-embed-text-v1" : {"mode": "embedding", "provider": "fireworks", "base_model": "nomic-embed-text-v1", "max_input_tokens": 8192, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "nomic-ai/nomic-embed-text-v1.5" : {"mode": "embedding", "provider": "fireworks", "base_model": "nomic-embed-text", "max_input_tokens": 8192, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "nomic-embed-text" : {"mode": "embedding", "provider": "llamagate", "base_model": "nomic-embed-text", "max_input_tokens": 8192, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "nousresearch/hermes-2-pro-llama-3-8b" : {"mode": "chat", "provider": "novita", "base_model": "hermes-2-pro-llama-3-8b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000014}, "nousresearch/hermes-3-llama-3.1-405b" : {"mode": "chat", "provider": "openrouter", "base_model": "hermes-3-llama-3.1-405b", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "nousresearch/hermes-3-llama-3.1-70b" : {"mode": "chat", "provider": "openrouter", "base_model": "hermes-3-llama-3.1-70b", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003}, "nousresearch/hermes-4-405b" : {"mode": "chat", "provider": "openrouter", "base_model": "hermes-4-405b", "max_input_tokens": 131072, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "nousresearch/hermes-4-70b" : {"mode": "chat", "provider": "openrouter", "base_model": "hermes-4-70b", "max_input_tokens": 131072, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.0000004}, "nova" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-atc" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-atc", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-automotive" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-automotive", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-conversationalai" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-conversationalai", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-drivethru" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-drivethru", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-finance" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-finance", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-general" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-general", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-meeting" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-meeting", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-phonecall" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-phonecall", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-video" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-video", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-2-voicemail" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-2-voicemail", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-3" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-3", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-3-general" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-3-general", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-3-medical" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-3-medical", "input_cost_per_second": 0.00008667, "output_cost_per_second": 0}, "nova-general" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-general", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-lite-v1" : {"mode": "chat", "provider": "amazon_nova", "base_model": "nova-lite-v1", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024}, "nova-micro-v1" : {"mode": "chat", "provider": "amazon_nova", "base_model": "nova-micro-v1", "max_input_tokens": 128000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014}, "nova-phonecall" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "nova-phonecall", "input_cost_per_second": 0.00007167, "output_cost_per_second": 0}, "nova-premier-v1" : {"mode": "chat", "provider": "amazon_nova", "base_model": "nova-premier-v1", "max_input_tokens": 1000000, "max_output_tokens": 10000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.0000125}, "nova-pro-v1" : {"mode": "chat", "provider": "amazon_nova", "base_model": "nova-pro-v1", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032}, "nvidia.nemotron-nano-12b-v2" : {"mode": "chat", "provider": "bedrock", "base_model": "nvidia-nemotron-nano-12b-v2", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "nvidia.nemotron-nano-3-30b" : {"mode": "chat", "provider": "bedrock", "base_model": "nvidia-nemotron-nano-3-30b", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024}, "nvidia.nemotron-nano-9b-v2" : {"mode": "chat", "provider": "bedrock", "base_model": "nvidia-nemotron-nano-9b-v2", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000023}, "nvidia.nemotron-super-3-120b" : {"mode": "chat", "provider": "bedrock", "base_model": "nvidia-nemotron-super-3-120b", "max_input_tokens": 256000, "max_output_tokens": 32768, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000065}, "nvidia/Llama-3.1-Nemotron-70B-Instruct" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-3.1-nemotron-70b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006}, "nvidia/Llama-3.1-Nemotron-Ultra-253B-v1" : {"mode": "chat", "provider": "nebius", "base_model": "llama-3.1-nemotron-ultra-253b-v1", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000018}, "nvidia/Llama-3.3-Nemotron-Super-49B-v1" : {"mode": "chat", "provider": "nebius", "base_model": "llama-3.3-nemotron-super-49b-v1", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004}, "nvidia/Llama-3.3-Nemotron-Super-49B-v1.5" : {"mode": "chat", "provider": "deepinfra", "base_model": "llama-3.3-nemotron-super-49b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004}, "nvidia/NVIDIA-Nemotron-Nano-9B-v2" : {"mode": "chat", "provider": "deepinfra", "base_model": "nvidia-nemotron-nano-9b-v2", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000016}, "nvidia/Nemotron-120B-A12B" : {"mode": "chat", "provider": "baseten", "base_model": "nemotron-120b-a12b", "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.00000075}, "nvidia/llama-3.3-nemotron-super-49b-v1.5" : {"mode": "chat", "provider": "openrouter", "base_model": "llama-3.3-nemotron-super-49b-v1.5", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004}, "nvidia/llama-3_2-nv-rerankqa-1b-v2" : {"mode": "rerank", "provider": "nvidia_nim", "base_model": "llama-3-2-nv-rerankqa-1b-v2", "input_cost_per_token": 0, "output_cost_per_token": 0}, "nvidia/nemotron-3-nano-30b-a3b" : {"mode": "chat", "provider": "openrouter", "base_model": "nemotron-3-nano-30b-a3b", "max_input_tokens": 262144, "max_output_tokens": 228000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000002}, "nvidia/nemotron-3-super-120b-a12b" : {"mode": "chat", "provider": "openrouter", "base_model": "nemotron-3-super-120b-a12b", "max_input_tokens": 262144, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000045}, "nvidia/nemotron-3-ultra-550b-a55b" : {"mode": "chat", "provider": "openrouter", "base_model": "nemotron-3-ultra-550b-a55b", "max_input_tokens": 262144, "max_output_tokens": 16384, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.00000015}, "nvidia/nemotron-nano-9b-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "nemotron-nano-9b-v2", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000016}, "nvidia/nv-rerankqa-mistral-4b-v3" : {"mode": "rerank", "provider": "nvidia_nim", "base_model": "nv-rerankqa-mistral-4b-v3", "input_cost_per_token": 0, "output_cost_per_token": 0}, "nvidia/parakeet-tdt-0.6b-v3" : {"mode": "chat", "provider": "openrouter", "base_model": "parakeet-tdt-0.6b-v3", "max_input_tokens": 0, "input_cost_per_token": 0.0015}, "o1" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075}, "o1-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075}, "o1-mini" : {"mode": "chat", "provider": "azure", "base_model": "o1-mini", "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.00000121, "output_cost_per_token": 0.00000484, "cache_read_input_token_cost": 0.000000605}, "o1-mini-2024-09-12" : {"mode": "chat", "provider": "azure", "base_model": "o1-mini", "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055}, "o1-preview" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075}, "o1-preview-2024-09-12" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075}, "o1-pro" : {"mode": "responses", "provider": "openai", "base_model": "o1-pro", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00015, "output_cost_per_token": 0.0006, "input_cost_per_token_batches": 0.000075, "output_cost_per_token_batches": 0.0003}, "o1-pro-2025-03-19" : {"mode": "responses", "provider": "openai", "base_model": "o1-pro", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00015, "output_cost_per_token": 0.0006, "input_cost_per_token_batches": 0.000075, "output_cost_per_token_batches": 0.0003}, "o3" : {"mode": "chat", "provider": "azure", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005}, "o3-2025-04-16" : {"mode": "chat", "provider": "openai", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005}, "o3-deep-research" : {"mode": "responses", "provider": "azure", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00004, "cache_read_input_token_cost": 0.0000025}, "o3-deep-research-2025-06-26" : {"mode": "responses", "provider": "openai", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00004, "cache_read_input_token_cost": 0.0000025, "input_cost_per_token_batches": 0.000005, "output_cost_per_token_batches": 0.00002}, "o3-mini" : {"mode": "chat", "provider": "azure", "base_model": "o3-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055}, "o3-mini-2025-01-31" : {"mode": "chat", "provider": "openai", "base_model": "o3-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055}, "o3-pro" : {"mode": "responses", "provider": "azure", "base_model": "o3-pro", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00002, "output_cost_per_token": 0.00008, "input_cost_per_token_batches": 0.00001, "output_cost_per_token_batches": 0.00004}, "o3-pro-2025-06-10" : {"mode": "responses", "provider": "openai", "base_model": "o3-pro", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00002, "output_cost_per_token": 0.00008, "input_cost_per_token_batches": 0.00001, "output_cost_per_token_batches": 0.00004}, "o4-mini" : {"mode": "chat", "provider": "azure", "base_model": "o4-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.000000275}, "o4-mini-2025-04-16" : {"mode": "chat", "provider": "openai", "base_model": "o4-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.000000275}, "o4-mini-deep-research" : {"mode": "responses", "provider": "openai", "base_model": "o4-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000004}, "o4-mini-deep-research-2025-06-26" : {"mode": "responses", "provider": "openai", "base_model": "o4-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000004}, "omni-moderation-2024-09-26" : {"mode": "moderation", "provider": "openai", "base_model": "omni-moderation", "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0, "output_cost_per_token": 0}, "omni-moderation-latest" : {"mode": "moderation", "provider": "openai", "base_model": "omni-moderation", "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0, "output_cost_per_token": 0}, "open-codestral-mamba" : {"mode": "chat", "provider": "mistral", "base_model": "codestral-mamba", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025}, "open-mistral-7b" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-7b", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025}, "open-mistral-nemo" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-nemo", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003}, "open-mistral-nemo-2407" : {"mode": "chat", "provider": "mistral", "base_model": "mistral-nemo", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003}, "open-mixtral-8x22b" : {"mode": "chat", "provider": "mistral", "base_model": "mixtral-8x22b", "max_input_tokens": 65336, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "open-mixtral-8x7b" : {"mode": "chat", "provider": "mistral", "base_model": "mixtral-8x7b", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000007}, "openai-gpt-4o" : {"mode": "chat", "provider": "gradient_ai", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384}, "openai-gpt-4o-mini" : {"mode": "chat", "provider": "gradient_ai", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384}, "openai-o3" : {"mode": "chat", "provider": "gradient_ai", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "openai-o3-mini" : {"mode": "chat", "provider": "gradient_ai", "base_model": "o3-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044}, "openai.gpt-5" : {"mode": "chat", "provider": "oci", "base_model": "gpt-5", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001}, "openai.gpt-5-mini" : {"mode": "chat", "provider": "oci", "base_model": "gpt-5-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002}, "openai.gpt-5-nano" : {"mode": "chat", "provider": "oci", "base_model": "gpt-5-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000004}, "openai.gpt-oss-120b" : {"mode": "chat", "provider": "bedrock", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "openai.gpt-oss-120b-1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "gpt-oss-120b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "openai.gpt-oss-20b" : {"mode": "chat", "provider": "bedrock", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003}, "openai.gpt-oss-20b-1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "gpt-oss-20b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.0000003}, "openai.gpt-oss-safeguard-120b" : {"mode": "chat", "provider": "bedrock", "base_model": "gpt-oss-120b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "openai.gpt-oss-safeguard-20b" : {"mode": "chat", "provider": "bedrock", "base_model": "gpt-oss-20b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.0000002}, "openai/gpt-3.5-turbo" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "gpt-3.5-turbo", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "openai/gpt-3.5-turbo-0613" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-3.5-turbo-0613", "max_input_tokens": 4095, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002}, "openai/gpt-3.5-turbo-16k" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-3.5-turbo-16k", "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004}, "openai/gpt-3.5-turbo-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-3.5-turbo-instruct", "max_input_tokens": 4095, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002}, "openai/gpt-4" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4", "max_input_tokens": 8191, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006}, "openai/gpt-4-0314" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4-0314", "max_input_tokens": 8191, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006}, "openai/gpt-4-1106-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4-1106-preview", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "openai/gpt-4-turbo" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "gpt-4-turbo", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "openai/gpt-4-turbo-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4-turbo-preview", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003}, "openai/gpt-4.1" : {"mode": "chat", "provider": "replicate", "base_model": "gpt-4.1", "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "openai/gpt-4.1-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4.1-mini", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016, "cache_read_input_token_cost": 0.0000001}, "openai/gpt-4.1-nano" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4.1-nano", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.000000025}, "openai/gpt-4o" : {"mode": "chat", "provider": "gmi", "base_model": "gpt-4o", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "openai/gpt-4o-2024-05-13" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015}, "openai/gpt-4o-2024-08-06" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-2024-08-06", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "openai/gpt-4o-2024-11-20" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-2024-11-20", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "openai/gpt-4o-mini" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000075, "cache_creation_input_token_cost": 0}, "openai/gpt-4o-mini-2024-07-18" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-mini-2024-07-18", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000075}, "openai/gpt-4o-mini-search-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-mini-search-preview", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "openai/gpt-4o-mini-transcribe" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-mini-transcribe", "max_input_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.000005}, "openai/gpt-4o-mini-tts-2025-12-15" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-mini-tts-2025-12-15", "max_input_tokens": 4096, "input_cost_per_token": 0.0000006}, "openai/gpt-4o-search-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-search-preview", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "openai/gpt-4o-transcribe" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-4o-transcribe", "max_input_tokens": 128000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "openai/gpt-5" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "openai/gpt-5-chat" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "openai/gpt-5-codex" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "openai/gpt-5-image" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5-image", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000125}, "openai/gpt-5-image-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5-image-mini", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.00000025}, "openai/gpt-5-mini" : {"mode": "responses", "provider": "perplexity", "base_model": "gpt-5-mini"}, "openai/gpt-5-nano" : {"mode": "chat", "provider": "replicate", "base_model": "gpt-5-nano", "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000004}, "openai/gpt-5-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5-pro", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00012}, "openai/gpt-5.1" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.1", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000013}, "openai/gpt-5.1-chat" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000013}, "openai/gpt-5.1-codex" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.1-codex", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.00000013}, "openai/gpt-5.1-codex-max" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.1-codex-max", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00001, "cache_read_input_token_cost": 0.000000125}, "openai/gpt-5.1-codex-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.1-codex-mini", "max_input_tokens": 400000, "max_output_tokens": 100000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.000000025}, "openai/gpt-5.2" : {"mode": "responses", "provider": "perplexity", "base_model": "gpt-5.2"}, "openai/gpt-5.2-chat" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.2-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_image": 0, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175}, "openai/gpt-5.2-codex" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.2-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175}, "openai/gpt-5.2-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.2-pro", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_image": 0, "input_cost_per_token": 0.000021, "output_cost_per_token": 0.000168}, "openai/gpt-5.3-chat" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.3-chat", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175}, "openai/gpt-5.3-codex" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.3-codex", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000175, "output_cost_per_token": 0.000014, "cache_read_input_token_cost": 0.000000175}, "openai/gpt-5.4" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.4", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.00000025}, "openai/gpt-5.4-image-2" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.4-image-2", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.000002}, "openai/gpt-5.4-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.4-mini", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.0000045, "cache_read_input_token_cost": 0.000000075}, "openai/gpt-5.4-nano" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.4-nano", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.00000002}, "openai/gpt-5.4-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.4-pro", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00018}, "openai/gpt-5.5" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.5", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00003, "cache_read_input_token_cost": 0.0000005}, "openai/gpt-5.5-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-5.5-pro", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00018}, "openai/gpt-audio" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-audio", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "openai/gpt-audio-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-audio-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000024}, "openai/gpt-chat-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-chat-latest", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00003, "cache_read_input_token_cost": 0.0000005}, "openai/gpt-image-1.5" : {"mode": "image_generation", "provider": "replicate", "base_model": "gpt-image-1.5", "output_cost_per_image_low_quality": 0.013, "output_cost_per_image_auto_quality": 0.136, "output_cost_per_image_high_quality": 0.136, "output_cost_per_image_medium_quality": 0.05}, "openai/gpt-oss-120b" : {"mode": "chat", "provider": "novita", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025}, "openai/gpt-oss-120b-maas" : {"mode": "chat", "provider": "vertex", "base_model": "gpt-oss-120b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "openai/gpt-oss-20b" : {"mode": "chat", "provider": "wandb", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.005, "output_cost_per_token": 0.02}, "openai/gpt-oss-20b-maas" : {"mode": "chat", "provider": "vertex", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003}, "openai/gpt-oss-safeguard-20b" : {"mode": "chat", "provider": "groq", "base_model": "gpt-oss-20b", "max_input_tokens": 131072, "max_output_tokens": 65536, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003, "cache_read_input_token_cost": 0.000000037}, "openai/o1" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "o1", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075, "cache_creation_input_token_cost": 0}, "openai/o1-mini" : {"mode": "chat", "provider": "replicate", "base_model": "o1-mini", "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044}, "openai/o1-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "o1-pro", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00015, "output_cost_per_token": 0.0006}, "openai/o3" : {"mode": "chat", "provider": "openrouter", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005}, "openai/o3-deep-research" : {"mode": "chat", "provider": "openrouter", "base_model": "o3-deep-research", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00004, "cache_read_input_token_cost": 0.0000025}, "openai/o3-mini" : {"mode": "chat", "provider": "openrouter", "base_model": "o3-mini", "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055}, "openai/o3-mini-high" : {"mode": "chat", "provider": "openrouter", "base_model": "o3-mini-high", "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055}, "openai/o3-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "o3-pro", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00002, "output_cost_per_token": 0.00008}, "openai/o4-mini" : {"mode": "chat", "provider": "replicate", "base_model": "o4-mini", "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000004}, "openai/o4-mini-deep-research" : {"mode": "chat", "provider": "openrouter", "base_model": "o4-mini-deep-research", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "cache_read_input_token_cost": 0.0000005}, "openai/o4-mini-high" : {"mode": "chat", "provider": "openrouter", "base_model": "o4-mini-high", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.000000275}, "openai/text-embedding-3-large" : {"mode": "chat", "provider": "openrouter", "base_model": "text-embedding-3-large", "max_input_tokens": 8192, "input_cost_per_token": 0.00000013}, "openai/text-embedding-3-small" : {"mode": "embedding", "provider": "vercel_ai_gateway", "base_model": "text-embedding-3-small", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "openai/text-embedding-ada-002" : {"mode": "embedding", "provider": "vercel_ai_gateway", "base_model": "text-embedding-ada-002", "max_input_tokens": 0, "max_output_tokens": 0, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "openai/whisper-1" : {"mode": "chat", "provider": "openrouter", "base_model": "whisper-1", "max_input_tokens": 0, "input_cost_per_token": 0.006}, "openai/whisper-large-v3" : {"mode": "chat", "provider": "openrouter", "base_model": "whisper-large-v3", "max_input_tokens": 0, "input_cost_per_token": 0.0015}, "openai/whisper-large-v3-turbo" : {"mode": "chat", "provider": "openrouter", "base_model": "whisper-large-v3-turbo", "max_input_tokens": 0, "input_cost_per_token": 0.04}, "openrouter/auto" : {"mode": "chat", "provider": "openrouter", "base_model": "auto", "max_input_tokens": 2000000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "openrouter/bodybuilder" : {"mode": "chat", "provider": "openrouter", "base_model": "bodybuilder", "max_input_tokens": 128000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "openrouter/free" : {"mode": "chat", "provider": "openrouter", "base_model": "free", "max_input_tokens": 200000, "input_cost_per_token": 0, "output_cost_per_token": 0}, "openrouter/fusion" : {"mode": "chat", "provider": "openrouter", "base_model": "fusion", "max_input_tokens": 128000, "input_cost_per_token": -1, "output_cost_per_token": -1}, "openrouter/pareto-code" : {"mode": "chat", "provider": "openrouter", "base_model": "pareto-code", "max_input_tokens": 2000000, "input_cost_per_token": -1, "output_cost_per_token": -1}, "openthinker-7b" : {"mode": "chat", "provider": "llamagate", "base_model": "openthinker-7b", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000015}, "orca-mini" : {"mode": "completion", "provider": "ollama", "base_model": "orca-mini", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "oswe-vscode-prime" : {"mode": "chat", "provider": "github_copilot", "base_model": "oswe-vscode-prime", "max_input_tokens": 264000, "max_output_tokens": 64000}, "outpaint" : {"mode": "image_edit", "provider": "stability", "base_model": "outpaint", "output_cost_per_image": 0.004}, "paddlepaddle/paddleocr-vl" : {"mode": "chat", "provider": "novita", "base_model": "paddleocr-vl", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0.00000002}, "parse-legacy" : {"mode": "ocr", "provider": "reducto", "base_model": "parse-legacy"}, "parse-v3" : {"mode": "ocr", "provider": "reducto", "base_model": "parse-v3"}, "perceptron/perceptron-mk1" : {"mode": "chat", "provider": "openrouter", "base_model": "perceptron-mk1", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000015}, "perplexity/pplx-embed-v1-0.6b" : {"mode": "chat", "provider": "openrouter", "base_model": "pplx-embed-v1-0.6b", "max_input_tokens": 32000, "input_cost_per_token": 0.000000004}, "perplexity/pplx-embed-v1-4b" : {"mode": "chat", "provider": "openrouter", "base_model": "pplx-embed-v1-4b", "max_input_tokens": 32000, "input_cost_per_token": 0.00000003}, "perplexity/sonar" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "sonar", "max_input_tokens": 127000, "max_output_tokens": 8000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001}, "perplexity/sonar-deep-research" : {"mode": "chat", "provider": "openrouter", "base_model": "sonar-deep-research", "max_input_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "perplexity/sonar-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "sonar-pro", "max_input_tokens": 200000, "max_output_tokens": 8000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "perplexity/sonar-pro-search" : {"mode": "chat", "provider": "openrouter", "base_model": "sonar-pro-search", "max_input_tokens": 200000, "max_output_tokens": 8000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "perplexity/sonar-reasoning" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "sonar", "max_input_tokens": 127000, "max_output_tokens": 8000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005}, "perplexity/sonar-reasoning-pro" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "sonar-reasoning-pro", "max_input_tokens": 127000, "max_output_tokens": 8000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "pixtral-12b-2409" : {"mode": "chat", "provider": "mistral", "base_model": "pixtral-12b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "pixtral-large-2411" : {"mode": "chat", "provider": "mistral", "base_model": "pixtral-large", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "pixtral-large-latest" : {"mode": "chat", "provider": "mistral", "base_model": "pixtral-large", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "pixverse/pixverse-v4" : {"mode": "video_generation", "provider": "replicate", "base_model": "pixverse/pixverse-v4", "output_cost_per_video_per_second": 0.06}, "pixverse/pixverse-v4.5" : {"mode": "video_generation", "provider": "replicate", "base_model": "pixverse/pixverse", "output_cost_per_video_per_second": 0.06}, "playai-tts" : {"mode": "audio_speech", "provider": "groq", "base_model": "playai-tts", "max_input_tokens": 10000, "max_output_tokens": 10000, "input_cost_per_character": 0.00005}, "pplx-70b-chat" : {"mode": "chat", "provider": "perplexity", "base_model": "pplx-70b-chat", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000028}, "pplx-70b-online" : {"mode": "chat", "provider": "perplexity", "base_model": "pplx-70b-online", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0.0000028}, "pplx-7b-chat" : {"mode": "chat", "provider": "perplexity", "base_model": "pplx-7b-chat", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "pplx-7b-online" : {"mode": "chat", "provider": "perplexity", "base_model": "pplx-7b-online", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0.00000028}, "pplx-embed-v1-0.6b" : {"mode": "embedding", "provider": "perplexity", "base_model": "pplx-embed-v1-0.6b", "max_input_tokens": 32768, "input_cost_per_token": 0.000000004, "output_cost_per_token": 0}, "pplx-embed-v1-4b" : {"mode": "embedding", "provider": "perplexity", "base_model": "pplx-embed-v1-4b", "max_input_tokens": 32768, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0}, "preset/advanced-deep-research" : {"mode": "responses", "provider": "perplexity", "base_model": "preset/advanced"}, "preset/deep-research" : {"mode": "responses", "provider": "perplexity", "base_model": "preset/deep-research"}, "preset/fast-search" : {"mode": "responses", "provider": "perplexity", "base_model": "preset/fast-search"}, "preset/pro-search" : {"mode": "responses", "provider": "perplexity", "base_model": "preset/pro-search"}, "prime-intellect/intellect-3" : {"mode": "chat", "provider": "openrouter", "base_model": "intellect-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000011}, "prunaai/flux-fast" : {"mode": "image_generation", "provider": "replicate", "base_model": "prunaai/flux-fast", "output_cost_per_image": 0.005}, "prunaai/hidream-l1-fast" : {"mode": "image_generation", "provider": "replicate", "base_model": "prunaai/hidream-l1-fast", "output_cost_per_image": 0.005}, "prunaai/p-image" : {"mode": "image_generation", "provider": "replicate", "base_model": "prunaai/p-image", "output_cost_per_image": 0.005}, "qwen-3-235b-a22b-instruct-2507" : {"mode": "chat", "provider": "cerebras", "base_model": "qwen3-235b-a22b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000012, "input_cost_per_audio_token": 0}, "qwen-3-32b" : {"mode": "chat", "provider": "cerebras", "base_model": "qwen3-32b", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000008}, "qwen-coder" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-coder", "max_input_tokens": 1000000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000015}, "qwen-flash" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-flash", "max_input_tokens": 997952, "max_output_tokens": 32768}, "qwen-flash-2025-07-28" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-flash", "max_input_tokens": 997952, "max_output_tokens": 32768}, "qwen-image-2.0" : {"mode": "image_generation", "provider": "dashscope", "base_model": "qwen-image-2.0"}, "qwen-image-2.0-pro" : {"mode": "image_generation", "provider": "dashscope", "base_model": "qwen-image-2.0-pro"}, "qwen-max" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-max", "max_input_tokens": 30720, "max_output_tokens": 8192, "input_cost_per_token": 0.0000016, "output_cost_per_token": 0.0000064}, "qwen-plus" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 129024, "max_output_tokens": 16384, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000012}, "qwen-plus-2025-01-25" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 129024, "max_output_tokens": 8192, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000012}, "qwen-plus-2025-04-28" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 129024, "max_output_tokens": 16384, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000012}, "qwen-plus-2025-07-14" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 129024, "max_output_tokens": 16384, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000012}, "qwen-plus-2025-07-28" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 997952, "max_output_tokens": 32768}, "qwen-plus-2025-09-11" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 997952, "max_output_tokens": 32768}, "qwen-plus-latest" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-plus", "max_input_tokens": 997952, "max_output_tokens": 32768}, "qwen-turbo" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-turbo", "max_input_tokens": 129024, "max_output_tokens": 16384, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000002}, "qwen-turbo-2024-11-01" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-turbo", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000002}, "qwen-turbo-2025-04-28" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-turbo", "max_input_tokens": 1000000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000002}, "qwen-turbo-latest" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen-turbo", "max_input_tokens": 1000000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000002}, "qwen.qwen3-235b-a22b-2507-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-235b-a22b", "max_input_tokens": 262144, "max_output_tokens": 131072, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000088}, "qwen.qwen3-32b-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-32b", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "qwen.qwen3-coder-30b-a3b-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-30b-a3b", "max_input_tokens": 262144, "max_output_tokens": 131072, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006}, "qwen.qwen3-coder-480b-a35b-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-480b-a35b", "max_input_tokens": 262000, "max_output_tokens": 65536, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.0000018}, "qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000012}, "qwen.qwen3-next-80b-a3b" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-next-80b-a3b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000012}, "qwen.qwen3-vl-235b-a22b" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-vl-235b-a22b", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000053, "output_cost_per_token": 0.00000266}, "qwen/qwen-2.5-72b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen-2.5-72b-instruct", "max_input_tokens": 32768, "max_output_tokens": 16384, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.0000004}, "qwen/qwen-2.5-7b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen-2.5-7b-instruct", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.0000001}, "qwen/qwen-2.5-coder-32b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen2.5-coder-32b-instruct", "max_input_tokens": 33792, "max_output_tokens": 33792, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018}, "qwen/qwen-image" : {"mode": "image_generation", "provider": "replicate", "base_model": "qwen-image", "output_cost_per_image": 0.025}, "qwen/qwen-mt-plus" : {"mode": "chat", "provider": "novita", "base_model": "qwen-mt-plus", "max_input_tokens": 16384, "max_output_tokens": 8192, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000075}, "qwen/qwen-plus" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen-plus", "max_input_tokens": 1000000, "max_output_tokens": 32768, "input_cost_per_token": 0.00000026, "output_cost_per_token": 0.00000078, "cache_read_input_token_cost": 0.000000052, "cache_creation_input_token_cost": 0.000000325}, "qwen/qwen-plus-2025-07-28" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen-plus-2025-07-28", "max_input_tokens": 1000000, "max_output_tokens": 32768, "input_cost_per_token": 0.00000026, "output_cost_per_token": 0.00000078}, "qwen/qwen-plus-2025-07-28:thinking" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen-plus-2025-07-28:thinking", "max_input_tokens": 1000000, "max_output_tokens": 32768, "input_cost_per_token": 0.00000026, "output_cost_per_token": 0.00000078, "cache_creation_input_token_cost": 0.000000325}, "qwen/qwen-vl-plus" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen-vl-plus", "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_token": 0.00000021, "output_cost_per_token": 0.00000063}, "qwen/qwen2.5-7b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen2.5-7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000007}, "qwen/qwen2.5-vl-72b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen2.5-vl-72b-instruct", "max_input_tokens": 32000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000075}, "qwen/qwen3-14b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-14b", "max_input_tokens": 40960, "max_output_tokens": 40960, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.00000024}, "qwen/qwen3-235b-a22b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-235b-a22b", "max_input_tokens": 131072, "max_output_tokens": 8192, "input_cost_per_token": 0.000000455, "output_cost_per_token": 0.00000182}, "qwen/qwen3-235b-a22b-2507" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-235b-a22b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.000000071, "output_cost_per_token": 0.0000001}, "qwen/qwen3-235b-a22b-fp8" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-235b-a22b-fp8", "max_input_tokens": 40960, "max_output_tokens": 20000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000008}, "qwen/qwen3-235b-a22b-instruct-2507" : {"mode": "chat", "provider": "replicate", "base_model": "qwen3-235b-a22b-instruct", "input_cost_per_token": 0.000000264, "output_cost_per_token": 0.00000106}, "qwen/qwen3-235b-a22b-instruct-2507-maas" : {"mode": "chat", "provider": "vertex", "base_model": "qwen3-235b-a22b-instruct", "max_input_tokens": 262144, "max_output_tokens": 16384, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000001}, "qwen/qwen3-235b-a22b-thinking-2507" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-235b-a22b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.000003}, "qwen/qwen3-30b-a3b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-30b-a3b", "max_input_tokens": 40960, "max_output_tokens": 16384, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000045}, "qwen/qwen3-30b-a3b-fp8" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-30b-a3b-fp8", "max_input_tokens": 40960, "max_output_tokens": 20000, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.00000045}, "qwen/qwen3-30b-a3b-instruct-2507" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-30b-a3b-instruct-2507", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000004815, "output_cost_per_token": 0.00000019305}, "qwen/qwen3-30b-a3b-thinking-2507" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-30b-a3b-thinking-2507", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.00000008}, "qwen/qwen3-32b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-32b", "max_input_tokens": 40960, "max_output_tokens": 16384, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000028}, "qwen/qwen3-32b-fp8" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-32b-fp8", "max_input_tokens": 40960, "max_output_tokens": 20000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.00000045}, "qwen/qwen3-4b-fp8" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-4b-fp8", "max_input_tokens": 128000, "max_output_tokens": 20000, "input_cost_per_token": 0.00000003, "output_cost_per_token": 0.00000003}, "qwen/qwen3-8b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-8b", "max_input_tokens": 40960, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0.00000005}, "qwen/qwen3-8b-fp8" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-8b-fp8", "max_input_tokens": 128000, "max_output_tokens": 20000, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.000000138}, "qwen/qwen3-asr-flash-2026-02-10" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-asr-flash-2026-02-10", "max_input_tokens": 0, "input_cost_per_token": 0.000035}, "qwen/qwen3-coder" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-coder", "max_input_tokens": 262100, "max_output_tokens": 262100, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000095}, "qwen/qwen3-coder-30b-a3b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-coder-30b-a3b-instruct", "max_input_tokens": 160000, "max_output_tokens": 32768, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000027}, "qwen/qwen3-coder-480b-a35b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-coder-480b-a35b-instruct", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000013}, "qwen/qwen3-coder-480b-a35b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "qwen3-coder-480b-a35b-instruct", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000004}, "qwen/qwen3-coder-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-coder-flash", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.000000195, "output_cost_per_token": 0.000000975, "cache_read_input_token_cost": 0.000000039, "cache_creation_input_token_cost": 0.00000024375}, "qwen/qwen3-coder-next" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000011, "output_cost_per_token": 0.0000008, "cache_read_input_token_cost": 0.00000007}, "qwen/qwen3-coder-plus" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-coder-plus", "max_input_tokens": 997952, "max_output_tokens": 65536, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.00000013, "cache_creation_input_token_cost": 0.0000008125}, "qwen/qwen3-embedding-0.6b" : {"mode": "embedding", "provider": "novita", "base_model": "qwen3-embedding-0.6b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0}, "qwen/qwen3-embedding-4b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-embedding-4b", "max_input_tokens": 32768, "input_cost_per_token": 0.00000002}, "qwen/qwen3-embedding-8b" : {"mode": "embedding", "provider": "novita", "base_model": "qwen3-embedding-8b", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0}, "qwen/qwen3-max" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-max", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.00000211, "output_cost_per_token": 0.00000845}, "qwen/qwen3-max-thinking" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-max-thinking", "max_input_tokens": 262144, "max_output_tokens": 32768, "input_cost_per_token": 0.00000078, "output_cost_per_token": 0.0000039}, "qwen/qwen3-next-80b-a3b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-next-80b-a3b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000015}, "qwen/qwen3-next-80b-a3b-instruct-maas" : {"mode": "chat", "provider": "vertex", "base_model": "qwen3-next-80b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000012}, "qwen/qwen3-next-80b-a3b-thinking" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-next-80b-a3b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000000975, "output_cost_per_token": 0.00000078}, "qwen/qwen3-next-80b-a3b-thinking-maas" : {"mode": "chat", "provider": "vertex", "base_model": "qwen3-next-80b-a3b-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000012}, "qwen/qwen3-omni-30b-a3b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-omni-30b-a3b-instruct", "max_input_tokens": 65536, "max_output_tokens": 16384, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000097}, "qwen/qwen3-omni-30b-a3b-thinking" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-omni-30b-a3b-thinking", "max_input_tokens": 65536, "max_output_tokens": 16384, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000097}, "qwen/qwen3-reranker-8b" : {"mode": "rerank", "provider": "novita", "base_model": "qwen3-reranker-8b", "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000005}, "qwen/qwen3-vl-235b-a22b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-vl-235b-a22b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000015}, "qwen/qwen3-vl-235b-a22b-thinking" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-vl-235b-a22b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000098, "output_cost_per_token": 0.00000395}, "qwen/qwen3-vl-30b-a3b-instruct" : {"mode": "chat", "provider": "novita", "base_model": "qwen3-vl-30b-a3b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000007}, "qwen/qwen3-vl-30b-a3b-thinking" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-vl-30b-a3b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000156}, "qwen/qwen3-vl-32b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-vl-32b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.000000104, "output_cost_per_token": 0.000000416}, "qwen/qwen3-vl-8b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-vl-8b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.0000005}, "qwen/qwen3-vl-8b-thinking" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3-vl-8b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.000000117, "output_cost_per_token": 0.000001365}, "qwen/qwen3.5-122b-a10b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-122b-a10b", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "qwen/qwen3.5-27b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-27b", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000024}, "qwen/qwen3.5-35b-a3b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-35b-a3b", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.00000005}, "qwen/qwen3.5-397b-a17b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-397b-a17b", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000036}, "qwen/qwen3.5-9b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-9b", "max_input_tokens": 262144, "max_output_tokens": 81920, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000015}, "qwen/qwen3.5-flash-02-23" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-flash", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004}, "qwen/qwen3.5-plus-02-15" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-plus", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000024}, "qwen/qwen3.5-plus-20260420" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.5-plus-20260420", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000018, "cache_creation_input_token_cost": 0.000000375}, "qwen/qwen3.6-27b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.6-27b", "max_input_tokens": 262140, "max_output_tokens": 262140, "input_cost_per_token": 0.00000029, "output_cost_per_token": 0.0000032}, "qwen/qwen3.6-35b-a3b" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.6-35b-a3b", "max_input_tokens": 262140, "max_output_tokens": 262140, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.000001}, "qwen/qwen3.6-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.6-flash", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000001875, "output_cost_per_token": 0.000001125, "cache_creation_input_token_cost": 0.000000234375}, "qwen/qwen3.6-max-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.6-max-preview", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.00000104, "output_cost_per_token": 0.00000624, "cache_creation_input_token_cost": 0.0000013}, "qwen/qwen3.6-plus" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.6-plus", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.000000325, "output_cost_per_token": 0.00000195, "cache_creation_input_token_cost": 0.00000040625}, "qwen/qwen3.7-max" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.7-max", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.00000375, "cache_read_input_token_cost": 0.00000025, "cache_creation_input_token_cost": 0.0000015625}, "qwen/qwen3.7-plus" : {"mode": "chat", "provider": "openrouter", "base_model": "qwen3.7-plus", "max_input_tokens": 1000000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016, "cache_read_input_token_cost": 0.00000008, "cache_creation_input_token_cost": 0.0000005}, "qwen2.5-coder-7b" : {"mode": "chat", "provider": "llamagate", "base_model": "qwen2.5-coder-7b", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000012}, "qwen25-coder-32b-instruct" : {"mode": "chat", "provider": "lambda_ai", "base_model": "qwen2.5-coder-32b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000001}, "qwen3-30b-a3b" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-30b-a3b", "max_input_tokens": 129024, "max_output_tokens": 16384}, "qwen3-32b-fp8" : {"mode": "chat", "provider": "lambda_ai", "base_model": "qwen3-32b-fp8", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.0000001}, "qwen3-8b" : {"mode": "chat", "provider": "llamagate", "base_model": "qwen3-8b", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000014}, "qwen3-coder-flash" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-coder-flash", "max_input_tokens": 997952, "max_output_tokens": 65536}, "qwen3-coder-flash-2025-07-28" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-coder-flash", "max_input_tokens": 997952, "max_output_tokens": 65536}, "qwen3-coder-plus" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-coder-plus", "max_input_tokens": 997952, "max_output_tokens": 65536}, "qwen3-coder-plus-2025-07-22" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-coder-plus", "max_input_tokens": 997952, "max_output_tokens": 65536}, "qwen3-coder:480b-cloud" : {"mode": "chat", "provider": "ollama", "base_model": "qwen3-coder-480b", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0, "output_cost_per_token": 0}, "qwen3-embedding-8b" : {"mode": "embedding", "provider": "llamagate", "base_model": "qwen3-embedding-8b", "max_input_tokens": 40960, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "qwen3-max" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-max", "max_input_tokens": 258048, "max_output_tokens": 65536}, "qwen3-max-2026-01-23" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-max", "max_input_tokens": 258048, "max_output_tokens": 65536}, "qwen3-max-preview" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-max", "max_input_tokens": 258048, "max_output_tokens": 65536}, "qwen3-next-80b-a3b-instruct" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-next-80b-a3b-instruct", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000012}, "qwen3-next-80b-a3b-thinking" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-next-80b-a3b-thinking", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000012}, "qwen3-vl-235b-a22b-instruct" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-vl-235b-a22b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016}, "qwen3-vl-235b-a22b-thinking" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-vl-235b-a22b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000004}, "qwen3-vl-32b-instruct" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-vl-32b-instruct", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000016, "output_cost_per_token": 0.00000064}, "qwen3-vl-32b-thinking" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-vl-32b-thinking", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.00000016, "output_cost_per_token": 0.00000287}, "qwen3-vl-8b" : {"mode": "chat", "provider": "llamagate", "base_model": "qwen3-vl-8b", "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000055}, "qwen3-vl-plus" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3-vl-plus", "max_input_tokens": 260096, "max_output_tokens": 32768}, "qwen3.5-plus" : {"mode": "chat", "provider": "dashscope", "base_model": "qwen3.5-plus", "max_input_tokens": 991808, "max_output_tokens": 65536}, "qwq-plus" : {"mode": "chat", "provider": "dashscope", "base_model": "qwq-plus", "max_input_tokens": 98304, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024}, "ranking/nvidia/llama-3.2-nv-rerankqa-1b-v2" : {"mode": "rerank", "provider": "nvidia_nim", "base_model": "ranking/nvidia/llama-3.2-nv-rerankqa-1b-v2", "input_cost_per_token": 0, "output_cost_per_token": 0}, "recraft-ai/recraft-v3" : {"mode": "image_generation", "provider": "replicate", "base_model": "recraft-ai/recraft-v3", "output_cost_per_image": 0.04}, "recraftv2" : {"mode": "image_generation", "provider": "recraft", "base_model": "recraftv2", "output_cost_per_image": 0.022}, "recraftv3" : {"mode": "image_generation", "provider": "recraft", "base_model": "recraftv3", "output_cost_per_image": 0.04}, "reka-core" : {"mode": "chat", "provider": "snowflake", "base_model": "reka-core", "max_input_tokens": 32000, "max_output_tokens": 8192}, "reka-flash" : {"mode": "chat", "provider": "snowflake", "base_model": "reka-flash", "max_input_tokens": 100000, "max_output_tokens": 8192}, "rekaai/reka-edge" : {"mode": "chat", "provider": "openrouter", "base_model": "reka-edge", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "rekaai/reka-flash-3" : {"mode": "chat", "provider": "openrouter", "base_model": "reka-flash-3", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002}, "relace/relace-apply-3" : {"mode": "chat", "provider": "openrouter", "base_model": "relace-apply-3", "max_input_tokens": 256000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000085, "output_cost_per_token": 0.00000125}, "relace/relace-search" : {"mode": "chat", "provider": "openrouter", "base_model": "relace-search", "max_input_tokens": 256000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003}, "remove-background" : {"mode": "image_edit", "provider": "stability", "base_model": "remove-background", "output_cost_per_image": 0.005}, "replace-background-and-relight" : {"mode": "image_edit", "provider": "stability", "base_model": "replace-background-and-relight", "output_cost_per_image": 0.008}, "rerank-2" : {"mode": "rerank", "provider": "voyage", "base_model": "rerank-2", "max_input_tokens": 16000, "max_output_tokens": 16000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0}, "rerank-2-lite" : {"mode": "rerank", "provider": "voyage", "base_model": "rerank-2-lite", "max_input_tokens": 8000, "max_output_tokens": 8000, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "rerank-2.5" : {"mode": "rerank", "provider": "voyage", "base_model": "rerank-2.5", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0}, "rerank-2.5-lite" : {"mode": "rerank", "provider": "voyage", "base_model": "rerank-2.5-lite", "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "rerank-english-v2.0" : {"mode": "rerank", "provider": "cohere", "base_model": "rerank-english", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "rerank-english-v3.0" : {"mode": "rerank", "provider": "cohere", "base_model": "rerank-english", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "rerank-multilingual-v2.0" : {"mode": "rerank", "provider": "cohere", "base_model": "rerank-multilingual", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "rerank-multilingual-v3.0" : {"mode": "rerank", "provider": "cohere", "base_model": "rerank-multilingual", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "rerank-v3.5" : {"mode": "rerank", "provider": "cohere", "base_model": "rerank", "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "runwayml/gen4-turbo" : {"mode": "video_generation", "provider": "replicate", "base_model": "gen4-turbo", "output_cost_per_video_per_second": 0.05}, "sa-east-1/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000074, "output_cost_per_token": 0.00000222}, "sa-east-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000445, "output_cost_per_token": 0.00000588}, "sa-east-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.00000101}, "sa-east-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "sa-east-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000144}, "sa-east-1/moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000073, "output_cost_per_token": 0.00000303}, "sa-east-1/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.0000036}, "sa-east-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.00000144}, "sao10k/l3-70b-euryale-v2.1" : {"mode": "chat", "provider": "novita", "base_model": "l3-70b-euryale", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000148, "output_cost_per_token": 0.00000148}, "sao10k/l3-8b-lunaris" : {"mode": "chat", "provider": "novita", "base_model": "l3-8b-lunaris", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000005}, "sao10k/l3-euryale-70b" : {"mode": "chat", "provider": "openrouter", "base_model": "l3-euryale-70b", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000148, "output_cost_per_token": 0.00000148}, "sao10k/l3-lunaris-8b" : {"mode": "chat", "provider": "openrouter", "base_model": "l3-lunaris-8b", "max_input_tokens": 8192, "max_output_tokens": 16384, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000005}, "sao10k/l3.1-70b-hanami-x1" : {"mode": "chat", "provider": "openrouter", "base_model": "l3.1-70b-hanami-x1", "max_input_tokens": 16000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003}, "sao10k/l3.1-euryale-70b" : {"mode": "chat", "provider": "openrouter", "base_model": "l3.1-euryale-70b", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000085, "output_cost_per_token": 0.00000085}, "sao10k/l3.3-euryale-70b" : {"mode": "chat", "provider": "openrouter", "base_model": "l3.3-euryale-70b", "max_input_tokens": 131072, "max_output_tokens": 16384, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000075}, "sao10k/l31-70b-euryale-v2.2" : {"mode": "chat", "provider": "novita", "base_model": "l31-70b-euryale", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000148, "output_cost_per_token": 0.00000148}, "sarvam-m" : {"mode": "chat", "provider": "sarvam", "base_model": "sarvam-m", "max_input_tokens": 8192, "max_output_tokens": 32000, "input_cost_per_token": 0, "output_cost_per_token": 0, "cache_read_input_token_cost": 0, "cache_creation_input_token_cost": 0, "cache_creation_input_token_cost_above_1hr": 0}, "scribe_v1" : {"mode": "audio_transcription", "provider": "elevenlabs", "base_model": "scribe-v1", "input_cost_per_second": 0.0000611, "output_cost_per_second": 0}, "scribe_v1_experimental" : {"mode": "audio_transcription", "provider": "elevenlabs", "base_model": "scribe-v1", "input_cost_per_second": 0.0000611, "output_cost_per_second": 0}, "sd3" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3", "output_cost_per_image": 0.065}, "sd3-large" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3-large", "output_cost_per_image": 0.065}, "sd3-large-turbo" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3-large-turbo", "output_cost_per_image": 0.04}, "sd3-medium" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3-medium", "output_cost_per_image": 0.035}, "sd3.5-large" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3.5-large", "output_cost_per_image": 0.065}, "sd3.5-large-turbo" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3.5-large-turbo", "output_cost_per_image": 0.04}, "sd3.5-medium" : {"mode": "image_generation", "provider": "stability", "base_model": "sd3.5-medium", "output_cost_per_image": 0.035}, "sdaia/allam-1-13b-instruct" : {"mode": "chat", "provider": "watsonx", "base_model": "allam-1-13b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000018, "output_cost_per_token": 0.0000018}, "search" : {"mode": "search", "provider": "dataforseo", "base_model": "search"}, "search-advanced" : {"mode": "search", "provider": "tavily", "base_model": "search-advanced"}, "search-and-recolor" : {"mode": "image_edit", "provider": "stability", "base_model": "search-and-recolor", "output_cost_per_image": 0.005}, "search-and-replace" : {"mode": "image_edit", "provider": "stability", "base_model": "search-and-replace", "output_cost_per_image": 0.005}, "search-deep" : {"mode": "search", "provider": "linkup", "base_model": "search-deep"}, "search-pro" : {"mode": "search", "provider": "parallel_ai", "base_model": "search-pro"}, "search_api" : {"mode": "vector_store", "provider": "vertex", "base_model": "search-api"}, "sentence-transformers/all-minilm-l12-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "all-minilm-l12-v2", "max_input_tokens": 512, "input_cost_per_token": 0.000000005}, "sentence-transformers/all-minilm-l6-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "all-minilm-l6-v2", "max_input_tokens": 512, "input_cost_per_token": 0.000000005}, "sentence-transformers/all-mpnet-base-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "all-mpnet-base-v2", "max_input_tokens": 512, "input_cost_per_token": 0.000000005}, "sentence-transformers/multi-qa-mpnet-base-dot-v1" : {"mode": "chat", "provider": "openrouter", "base_model": "multi-qa-mpnet-base-dot-v1", "max_input_tokens": 512, "input_cost_per_token": 0.000000005}, "sentence-transformers/paraphrase-minilm-l6-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "paraphrase-minilm-l6-v2", "max_input_tokens": 512, "input_cost_per_token": 0.000000005}, "sesame/csm-1b" : {"mode": "chat", "provider": "openrouter", "base_model": "csm-1b", "max_input_tokens": 4096, "input_cost_per_token": 0.000007}, "sketch" : {"mode": "image_edit", "provider": "stability", "base_model": "sketch", "output_cost_per_image": 0.005}, "skywork/r1v4-lite" : {"mode": "chat", "provider": "novita", "base_model": "r1v4-lite", "max_input_tokens": 262144, "max_output_tokens": 65536, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006}, "snowflake-arctic" : {"mode": "chat", "provider": "snowflake", "base_model": "snowflake-arctic", "max_input_tokens": 4096, "max_output_tokens": 8192}, "snowflake-llama-3.1-405b" : {"mode": "chat", "provider": "snowflake", "base_model": "snowflake-llama-3.1-405b", "max_input_tokens": 8000, "max_output_tokens": 8192}, "snowflake-llama-3.3-70b" : {"mode": "chat", "provider": "snowflake", "base_model": "snowflake-llama-3.3-70b", "max_input_tokens": 8000, "max_output_tokens": 8192}, "sonar-deep-research" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar", "max_input_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "sonar-medium-chat" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar-medium-chat", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000018}, "sonar-medium-online" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar-medium-online", "max_input_tokens": 12000, "max_output_tokens": 12000, "input_cost_per_token": 0, "output_cost_per_token": 0.0000018}, "sonar-pro" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar-pro", "max_input_tokens": 200000, "max_output_tokens": 8000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "sonar-reasoning" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar", "max_input_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005}, "sonar-reasoning-pro" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar-reasoning-pro", "max_input_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008}, "sonar-small-chat" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar-small-chat", "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028}, "sonar-small-online" : {"mode": "chat", "provider": "perplexity", "base_model": "sonar-small-online", "max_input_tokens": 12000, "max_output_tokens": 12000, "input_cost_per_token": 0, "output_cost_per_token": 0.00000028}, "sora-2" : {"mode": "video_generation", "provider": "openai", "base_model": "sora-2", "output_cost_per_video_per_second": 0.1}, "sora-2-pro" : {"mode": "video_generation", "provider": "azure", "base_model": "sora-2-pro", "output_cost_per_video_per_second": 0.3}, "sora-2-pro-high-res" : {"mode": "video_generation", "provider": "openai", "base_model": "sora-2-pro", "output_cost_per_video_per_second": 0.5}, "speech-02-hd" : {"mode": "audio_speech", "provider": "minimax", "base_model": "speech-02-hd", "input_cost_per_character": 0.0001}, "speech-02-turbo" : {"mode": "audio_speech", "provider": "minimax", "base_model": "speech-02-turbo", "input_cost_per_character": 0.00006}, "speech-2.6-hd" : {"mode": "audio_speech", "provider": "minimax", "base_model": "speech-2.6-hd", "input_cost_per_character": 0.0001}, "speech-2.6-turbo" : {"mode": "audio_speech", "provider": "minimax", "base_model": "speech-2.6-turbo", "input_cost_per_character": 0.00006}, "speech/azure-stt" : {"mode": "audio_transcription", "provider": "azure", "base_model": "speech/azure-stt", "input_cost_per_second": 0.0002777778, "output_cost_per_second": 0}, "speech/azure-tts" : {"mode": "audio_speech", "provider": "azure", "base_model": "speech/azure-tts", "input_cost_per_character": 0.000015}, "speech/azure-tts-hd" : {"mode": "audio_speech", "provider": "azure", "base_model": "speech/azure-tts-hd", "input_cost_per_character": 0.00003}, "stability-ai/stable-diffusion-3.5-large" : {"mode": "image_generation", "provider": "replicate", "base_model": "stability-ai/stable-diffusion-3.5-large", "output_cost_per_image": 0.065}, "stability-ai/stable-diffusion-3.5-medium" : {"mode": "image_generation", "provider": "replicate", "base_model": "stability-ai/stable-diffusion-3.5-medium", "output_cost_per_image": 0.035}, "stability.sd3-5-large-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "sd3-5-large", "max_input_tokens": 77, "output_cost_per_image": 0.08}, "stability.sd3-large-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "sd3-large", "max_input_tokens": 77, "output_cost_per_image": 0.08}, "stability.stable-conservative-upscale-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-conservative-upscale", "max_input_tokens": 77, "output_cost_per_image": 0.4}, "stability.stable-creative-upscale-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-creative-upscale", "max_input_tokens": 77, "output_cost_per_image": 0.6}, "stability.stable-fast-upscale-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-fast-upscale", "max_input_tokens": 77, "output_cost_per_image": 0.03}, "stability.stable-image-control-sketch-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-control-sketch", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-control-structure-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-control-structure", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-core-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-image-core", "max_input_tokens": 77, "output_cost_per_image": 0.04}, "stability.stable-image-core-v1:1" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-image-core", "max_input_tokens": 77, "output_cost_per_image": 0.04}, "stability.stable-image-erase-object-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-erase-object", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-inpaint-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-inpaint", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-remove-background-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-remove-background", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-search-recolor-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-search-recolor", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-search-replace-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-search-replace", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-style-guide-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-image-style-guide", "max_input_tokens": 77, "output_cost_per_image": 0.07}, "stability.stable-image-ultra-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-image-ultra", "max_input_tokens": 77, "output_cost_per_image": 0.14}, "stability.stable-image-ultra-v1:1" : {"mode": "image_generation", "provider": "bedrock", "base_model": "stable-image-ultra", "max_input_tokens": 77, "output_cost_per_image": 0.14}, "stability.stable-outpaint-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-outpaint", "max_input_tokens": 77, "output_cost_per_image": 0.06}, "stability.stable-style-transfer-v1:0" : {"mode": "image_edit", "provider": "bedrock", "base_model": "stable-style-transfer", "max_input_tokens": 77, "output_cost_per_image": 0.08}, "stabilityai/stable-diffusion-xl-base-1.0" : {"mode": "image_generation", "provider": "nscale", "base_model": "stable-diffusion-xl-base-1.0", "input_cost_per_pixel": 0.000000003, "output_cost_per_pixel": 0}, "stable-image-core" : {"mode": "image_generation", "provider": "stability", "base_model": "stable-image-core", "output_cost_per_image": 0.03}, "stable-image-ultra" : {"mode": "image_generation", "provider": "stability", "base_model": "stable-image-ultra", "output_cost_per_image": 0.08}, "standard" : {"mode": "audio_speech", "provider": "aws_polly", "base_model": "standard", "input_cost_per_character": 0.000004}, "standard/1024-x-1024/dall-e-2" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-2", "input_cost_per_pixel": 0, "output_cost_per_token": 0}, "standard/1024-x-1024/dall-e-3" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-3", "input_cost_per_pixel": 0.0000000381469, "output_cost_per_token": 0}, "standard/1024-x-1792/dall-e-3" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000004359, "output_cost_per_token": 0}, "standard/1792-x-1024/dall-e-3" : {"mode": "image_generation", "provider": "azure", "base_model": "dall-e-3", "input_cost_per_pixel": 0.00000004359, "output_cost_per_token": 0}, "stepfun/step-3.5-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "step-3.5-flash", "max_input_tokens": 262144, "max_output_tokens": 16384, "input_cost_per_token": 0.00000009, "output_cost_per_token": 0.0000003, "cache_read_input_token_cost": 0.00000002}, "stepfun/step-3.7-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "step-3.7-flash", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000115, "cache_read_input_token_cost": 0.00000004}, "structure" : {"mode": "image_edit", "provider": "stability", "base_model": "structure", "output_cost_per_image": 0.005}, "style" : {"mode": "image_edit", "provider": "stability", "base_model": "style", "output_cost_per_image": 0.005}, "style-transfer" : {"mode": "image_edit", "provider": "stability", "base_model": "style-transfer", "output_cost_per_image": 0.008}, "swiss-ai/apertus-70b-instruct" : {"mode": "chat", "provider": "publicai", "base_model": "apertus-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "swiss-ai/apertus-8b-instruct" : {"mode": "chat", "provider": "publicai", "base_model": "apertus-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0, "output_cost_per_token": 0}, "switchpoint/router" : {"mode": "chat", "provider": "openrouter", "base_model": "router", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000085, "output_cost_per_token": 0.0000034}, "tencent/hunyuan-a13b-instruct" : {"mode": "chat", "provider": "openrouter", "base_model": "hunyuan-a13b-instruct", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000057}, "tencent/hy3-preview" : {"mode": "chat", "provider": "openrouter", "base_model": "hy3-preview", "max_input_tokens": 262144, "input_cost_per_token": 0.000000063, "output_cost_per_token": 0.00000021, "cache_read_input_token_cost": 0.000000021}, "text-bison" : {"mode": "completion", "provider": "palm", "base_model": "text-bison", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125}, "text-bison-001" : {"mode": "completion", "provider": "palm", "base_model": "text-bison-001", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125}, "text-bison-safety-off" : {"mode": "completion", "provider": "palm", "base_model": "text-bison-safety-off", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125}, "text-bison-safety-recitation-off" : {"mode": "completion", "provider": "palm", "base_model": "text-bison-safety-recitation-off", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125}, "text-embedding-004" : {"mode": "embedding", "provider": "vertex", "base_model": "text-embedding-004", "max_input_tokens": 2048, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "input_cost_per_character": 0.000000025}, "text-embedding-005" : {"mode": "embedding", "provider": "vertex", "base_model": "text-embedding-005", "max_input_tokens": 2048, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "input_cost_per_character": 0.000000025}, "text-embedding-3-large" : {"mode": "embedding", "provider": "azure", "base_model": "text-embedding-3-large", "max_input_tokens": 8191, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0}, "text-embedding-3-small" : {"mode": "embedding", "provider": "openai", "base_model": "text-embedding-3-small", "max_input_tokens": 8191, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0, "input_cost_per_token_batches": 0.00000001, "output_cost_per_token_batches": 0}, "text-embedding-3-small-inference" : {"mode": "embedding", "provider": "github_copilot", "base_model": "text-embedding-3-small-inference", "max_input_tokens": 8191}, "text-embedding-ada-002" : {"mode": "embedding", "provider": "azure", "base_model": "text-embedding-ada-002", "max_input_tokens": 8191, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "text-embedding-ada-002-v2" : {"mode": "embedding", "provider": "openai", "base_model": "text-embedding-ada-002", "max_input_tokens": 8191, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "input_cost_per_token_batches": 0.00000005, "output_cost_per_token_batches": 0}, "text-embedding-large-exp-03-07" : {"mode": "embedding", "provider": "vertex", "base_model": "text-embedding-large", "max_input_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "input_cost_per_character": 0.000000025}, "text-embedding-preview-0409" : {"mode": "embedding", "provider": "vertex", "base_model": "text-embedding", "max_input_tokens": 3072, "input_cost_per_token": 0.00000000625, "output_cost_per_token": 0}, "text-moderation-007" : {"mode": "moderation", "provider": "openai", "base_model": "text-moderation-007", "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0, "output_cost_per_token": 0}, "text-moderation-latest" : {"mode": "moderation", "provider": "openai", "base_model": "text-moderation", "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0, "output_cost_per_token": 0}, "text-moderation-stable" : {"mode": "moderation", "provider": "openai", "base_model": "text-moderation-stable", "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0, "output_cost_per_token": 0}, "text-multilingual-embedding-002" : {"mode": "embedding", "provider": "vertex", "base_model": "text-multilingual-embedding-002", "max_input_tokens": 2048, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "input_cost_per_character": 0.000000025}, "text-unicorn" : {"mode": "completion", "provider": "vertex", "base_model": "text-unicorn", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.000028}, "text-unicorn@001" : {"mode": "completion", "provider": "vertex", "base_model": "text-unicorn", "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.000028}, "thedrummer/cydonia-24b-v4.1" : {"mode": "chat", "provider": "openrouter", "base_model": "cydonia-24b-v4.1", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.00000015}, "thedrummer/rocinante-12b" : {"mode": "chat", "provider": "openrouter", "base_model": "rocinante-12b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000043}, "thedrummer/skyfall-36b-v2" : {"mode": "chat", "provider": "openrouter", "base_model": "skyfall-36b-v2", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.0000008, "cache_read_input_token_cost": 0.00000025}, "thedrummer/unslopnemo-12b" : {"mode": "chat", "provider": "openrouter", "base_model": "unslopnemo-12b", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000004}, "thenlper/gte-base" : {"mode": "embedding", "provider": "fireworks", "base_model": "gte-base", "max_input_tokens": 512, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "thenlper/gte-large" : {"mode": "embedding", "provider": "fireworks", "base_model": "gte-large", "max_input_tokens": 512, "input_cost_per_token": 0.000000016, "output_cost_per_token": 0}, "together-ai-21.1b-41b" : {"mode": "chat", "provider": "together_ai", "base_model": "together-ai-21.1b-41b", "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000008}, "together-ai-4.1b-8b" : {"mode": "chat", "provider": "together_ai", "base_model": "together-ai-4.1b-8b", "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002}, "together-ai-41.1b-80b" : {"mode": "chat", "provider": "together_ai", "base_model": "together-ai-41.1b-80b", "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009}, "together-ai-8.1b-21b" : {"mode": "chat", "provider": "together_ai", "base_model": "together-ai-8.1b-21b", "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003}, "together-ai-81.1b-110b" : {"mode": "chat", "provider": "together_ai", "base_model": "together-ai-81.1b-110b", "input_cost_per_token": 0.0000018, "output_cost_per_token": 0.0000018}, "together-ai-embedding-151m-to-350m" : {"mode": "embedding", "provider": "together_ai", "base_model": "together-ai-embedding-151m-to-350m", "input_cost_per_token": 0.000000016, "output_cost_per_token": 0}, "together-ai-embedding-up-to-150m" : {"mode": "embedding", "provider": "together_ai", "base_model": "together-ai-embedding-up-to-150m", "input_cost_per_token": 0.000000008, "output_cost_per_token": 0}, "together-ai-up-to-4b" : {"mode": "chat", "provider": "together_ai", "base_model": "together-ai-up-to-4b", "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "togethercomputer/CodeLlama-34b-Instruct" : {"mode": "chat", "provider": "together_ai", "base_model": "codellama-34b-instruct"}, "tts-1" : {"mode": "audio_speech", "provider": "azure", "base_model": "tts-1", "input_cost_per_character": 0.000015}, "tts-1-1106" : {"mode": "audio_speech", "provider": "openai", "base_model": "tts-1", "input_cost_per_character": 0.000015}, "tts-1-hd" : {"mode": "audio_speech", "provider": "azure", "base_model": "tts-1-hd", "input_cost_per_character": 0.00003}, "tts-1-hd-1106" : {"mode": "audio_speech", "provider": "openai", "base_model": "tts-1-hd", "input_cost_per_character": 0.00003}, "twelvelabs.marengo-embed-2-7-v1:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "marengo-embed-2-7", "max_input_tokens": 77, "input_cost_per_token": 0.00007, "output_cost_per_token": 0}, "twelvelabs.pegasus-1-2-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "pegasus-1-2", "output_cost_per_token": 0.0000075, "input_cost_per_video_per_second": 0.00049}, "undi95/remm-slerp-l2-13b" : {"mode": "chat", "provider": "openrouter", "base_model": "remm-slerp-l2-13b", "max_input_tokens": 6144, "max_output_tokens": 4096, "input_cost_per_token": 0.000001875, "output_cost_per_token": 0.000001875}, "upstage/solar-pro-3" : {"mode": "chat", "provider": "openrouter", "base_model": "solar-pro-3", "max_input_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "cache_read_input_token_cost": 0.000000015}, "us-east-1/1-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.011, "output_cost_per_second": 0.011}, "us-east-1/1-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175}, "us-east-1/1-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175}, "us-east-1/6-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00611, "output_cost_per_second": 0.00611}, "us-east-1/6-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972}, "us-east-1/6-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972}, "us-east-1/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024}, "us-east-1/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "us-east-1/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "us-east-1/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000062, "output_cost_per_token": 0.00000185}, "us-east-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035}, "us-east-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006}, "us-east-1/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "us-east-1/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "us-east-1/mistral.mistral-7b-instruct-v0:2" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000002}, "us-east-1/mistral.mistral-large-2402-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-large", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "us-east-1/mistral.mixtral-8x7b-instruct-v0:1" : {"mode": "chat", "provider": "bedrock", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000007}, "us-east-1/moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "us-east-1/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003}, "us-east-1/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000012}, "us-east-1/zai.glm-5" : {"mode": "chat", "provider": "bedrock", "base_model": "zai.glm-5", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.0000032}, "us-east-2/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000062, "output_cost_per_token": 0.00000185}, "us-east-2/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "us-east-2/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "us-east-2/moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "us-east-2/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003}, "us-east-2/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000012}, "us-gov-east-1/amazon.nova-pro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000096, "output_cost_per_token": 0.00000384}, "us-gov-east-1/amazon.titan-embed-text-v1" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-text-v1", "max_input_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "us-gov-east-1/amazon.titan-embed-text-v2:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-text", "max_input_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0}, "us-gov-east-1/amazon.titan-text-express-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-express-v1", "max_input_tokens": 42000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000013, "output_cost_per_token": 0.0000017}, "us-gov-east-1/amazon.titan-text-lite-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-lite-v1", "max_input_tokens": 42000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000004}, "us-gov-east-1/amazon.titan-text-premier-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-premier", "max_input_tokens": 42000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "us-gov-east-1/anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000036, "output_cost_per_token": 0.000018, "cache_read_input_token_cost": 0.00000036, "cache_creation_input_token_cost": 0.0000045}, "us-gov-east-1/anthropic.claude-3-haiku-20240307-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "us-gov-east-1/anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.00000012, "cache_creation_input_token_cost": 0.0000015}, "us-gov-east-1/anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "us-gov-east-1/claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "us-gov-east-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035}, "us-gov-east-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8000, "max_output_tokens": 2048, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.00000265}, "us-gov-west-1/amazon.nova-pro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000096, "output_cost_per_token": 0.00000384}, "us-gov-west-1/amazon.titan-embed-text-v1" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-text-v1", "max_input_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "us-gov-west-1/amazon.titan-embed-text-v2:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "titan-embed-text", "max_input_tokens": 8192, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0}, "us-gov-west-1/amazon.titan-text-express-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-express-v1", "max_input_tokens": 42000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000013, "output_cost_per_token": 0.0000017}, "us-gov-west-1/amazon.titan-text-lite-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-lite-v1", "max_input_tokens": 42000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000004}, "us-gov-west-1/amazon.titan-text-premier-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "titan-text-premier", "max_input_tokens": 42000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015}, "us-gov-west-1/anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000036, "output_cost_per_token": 0.000018, "cache_read_input_token_cost": 0.00000036, "cache_creation_input_token_cost": 0.0000045}, "us-gov-west-1/anthropic.claude-3-7-sonnet-20250219-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000036, "output_cost_per_token": 0.000018, "cache_read_input_token_cost": 0.00000036, "cache_creation_input_token_cost": 0.0000045}, "us-gov-west-1/anthropic.claude-3-haiku-20240307-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0.00000003, "cache_creation_input_token_cost": 0.000000375}, "us-gov-west-1/anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.00000012, "cache_creation_input_token_cost": 0.0000015}, "us-gov-west-1/anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "us-gov-west-1/claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "us-gov-west-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035}, "us-gov-west-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8000, "max_output_tokens": 2048, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.00000265}, "us-gov.anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125, "input_cost_per_token_above_200k_tokens": 0.0000066, "output_cost_per_token_above_200k_tokens": 0.00002475, "cache_read_input_token_cost_above_200k_tokens": 0.00000066, "cache_creation_input_token_cost_above_200k_tokens": 0.00000825}, "us-west-1/meta.llama3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-70b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035}, "us-west-1/meta.llama3-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-8b-instruct", "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006}, "us-west-2/1-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.011, "output_cost_per_second": 0.011}, "us-west-2/1-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175}, "us-west-2/1-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175}, "us-west-2/6-month-commitment/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00611, "output_cost_per_second": 0.00611}, "us-west-2/6-month-commitment/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972}, "us-west-2/6-month-commitment/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972}, "us-west-2/anthropic.claude-instant-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-instant-v1", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024}, "us-west-2/anthropic.claude-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "us-west-2/anthropic.claude-v2:1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude", "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "us-west-2/deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000062, "output_cost_per_token": 0.00000185}, "us-west-2/minimax.minimax-m2.1" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.1", "max_input_tokens": 196000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "us-west-2/minimax.minimax-m2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "minimax-m2.5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012}, "us-west-2/mistral.mistral-7b-instruct-v0:2" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000002}, "us-west-2/mistral.mistral-large-2402-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "mistral-large", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024}, "us-west-2/mistral.mixtral-8x7b-instruct-v0:1" : {"mode": "chat", "provider": "bedrock", "base_model": "mixtral-8x7b-instruct", "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000007}, "us-west-2/moonshotai.kimi-k2-thinking" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2-thinking", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000025}, "us-west-2/moonshotai.kimi-k2.5" : {"mode": "chat", "provider": "bedrock", "base_model": "kimi-k2.5", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000003}, "us-west-2/qwen.qwen3-coder-next" : {"mode": "chat", "provider": "bedrock", "base_model": "qwen3-coder-next", "max_input_tokens": 262144, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000012}, "us-west-2/zai.glm-5" : {"mode": "chat", "provider": "bedrock", "base_model": "zai.glm-5", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.0000032}, "us.amazon.nova-2-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-lite", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.00000033, "output_cost_per_token": 0.00000275, "cache_read_input_token_cost": 0.0000000825}, "us.amazon.nova-2-pro-preview-20251202-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-2-pro", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000021875, "output_cost_per_token": 0.0000175, "input_cost_per_audio_token": 0.0000021875, "input_cost_per_image_token": 0.0000021875, "cache_read_input_token_cost": 0.000000546875}, "us.amazon.nova-canvas-v1:0" : {"mode": "image_generation", "provider": "bedrock", "base_model": "nova-canvas", "max_input_tokens": 2600, "output_cost_per_image": 0.06}, "us.amazon.nova-lite-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-lite", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024}, "us.amazon.nova-micro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-micro", "max_input_tokens": 128000, "max_output_tokens": 10000, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014}, "us.amazon.nova-premier-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-premier", "max_input_tokens": 1000000, "max_output_tokens": 10000, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.0000125}, "us.amazon.nova-pro-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "nova-pro", "max_input_tokens": 300000, "max_output_tokens": 10000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032}, "us.anthropic.claude-3-5-haiku-20241022-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-haiku", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000008, "cache_creation_input_token_cost": 0.000001}, "us.anthropic.claude-3-5-sonnet-20240620-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "us.anthropic.claude-3-5-sonnet-20241022-v2:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-5-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "us.anthropic.claude-3-7-sonnet-20250219-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-7-sonnet", "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "us.anthropic.claude-3-haiku-20240307-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-haiku", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_read_input_token_cost": 0.000000025, "cache_creation_input_token_cost": 0.0000003125}, "us.anthropic.claude-3-opus-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-opus", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "us.anthropic.claude-3-sonnet-20240229-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-3-sonnet", "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "us.anthropic.claude-haiku-4-5-20251001-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-haiku-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000055, "cache_read_input_token_cost": 0.00000011, "cache_creation_input_token_cost": 0.000001375, "cache_creation_input_token_cost_above_1hr": 0.0000022}, "us.anthropic.claude-opus-4-1-20250805-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-1", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "us.anthropic.claude-opus-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_read_input_token_cost": 0.0000015, "cache_creation_input_token_cost": 0.00001875}, "us.anthropic.claude-opus-4-5-20251101-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875, "cache_creation_input_token_cost_above_1hr": 0.000011}, "us.anthropic.claude-opus-4-6-v1" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-6", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875}, "us.anthropic.claude-opus-4-7" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-7", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.0000275, "cache_read_input_token_cost": 0.00000055, "cache_creation_input_token_cost": 0.000006875, "cache_creation_input_token_cost_above_1hr": 0.000011}, "us.anthropic.claude-opus-4-8" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-opus-4-8", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625, "cache_creation_input_token_cost_above_1hr": 0.00001}, "us.anthropic.claude-sonnet-4-20250514-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375, "input_cost_per_token_above_200k_tokens": 0.000006, "output_cost_per_token_above_200k_tokens": 0.0000225, "cache_read_input_token_cost_above_200k_tokens": 0.0000006, "cache_creation_input_token_cost_above_200k_tokens": 0.0000075}, "us.anthropic.claude-sonnet-4-5-20250929-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-5", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125, "input_cost_per_token_above_200k_tokens": 0.0000066, "output_cost_per_token_above_200k_tokens": 0.00002475, "cache_creation_input_token_cost_above_1hr": 0.0000066, "cache_read_input_token_cost_above_200k_tokens": 0.00000066, "cache_creation_input_token_cost_above_200k_tokens": 0.00000825, "cache_creation_input_token_cost_above_1hr_above_200k_tokens": 0.0000132}, "us.anthropic.claude-sonnet-4-6" : {"mode": "chat", "provider": "bedrock", "base_model": "claude-sonnet-4-6", "max_input_tokens": 1000000, "max_output_tokens": 64000, "input_cost_per_token": 0.0000033, "output_cost_per_token": 0.0000165, "cache_read_input_token_cost": 0.00000033, "cache_creation_input_token_cost": 0.000004125}, "us.deepseek.r1-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek-r1", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000135, "output_cost_per_token": 0.0000054}, "us.deepseek.v3.2" : {"mode": "chat", "provider": "bedrock", "base_model": "deepseek", "max_input_tokens": 163840, "max_output_tokens": 163840, "input_cost_per_token": 0.00000062, "output_cost_per_token": 0.00000185}, "us.meta.llama3-1-405b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-1-405b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000532, "output_cost_per_token": 0.000016}, "us.meta.llama3-1-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-1-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000099, "output_cost_per_token": 0.00000099}, "us.meta.llama3-1-8b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-1-8b-instruct", "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000022}, "us.meta.llama3-2-11b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-11b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035}, "us.meta.llama3-2-1b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-1b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "us.meta.llama3-2-3b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-3b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015}, "us.meta.llama3-2-90b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-2-90b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002}, "us.meta.llama3-3-70b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-3-3-70b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072}, "us.meta.llama4-maverick-17b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-4-maverick-17b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000024, "output_cost_per_token": 0.00000097, "input_cost_per_token_batches": 0.00000012, "output_cost_per_token_batches": 0.000000485}, "us.meta.llama4-scout-17b-instruct-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "llama-4-scout-17b-instruct", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000066, "input_cost_per_token_batches": 0.000000085, "output_cost_per_token_batches": 0.00000033}, "us.mistral.pixtral-large-2502-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "pixtral-large", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006}, "us.twelvelabs.marengo-embed-2-7-v1:0" : {"mode": "embedding", "provider": "bedrock", "base_model": "marengo-embed-2-7", "max_input_tokens": 77, "input_cost_per_image": 0.0001, "input_cost_per_token": 0.00007, "output_cost_per_token": 0, "input_cost_per_audio_per_second": 0.00014, "input_cost_per_video_per_second": 0.0007}, "us.twelvelabs.pegasus-1-2-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "pegasus-1-2", "output_cost_per_token": 0.0000075, "input_cost_per_video_per_second": 0.00049}, "us.writer.palmyra-x4-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "palmyra-x4", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "us.writer.palmyra-x5-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "palmyra-x5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000006}, "us/gpt-4.1-2025-04-14" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.1", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.0000022, "output_cost_per_token": 0.0000088, "cache_read_input_token_cost": 0.00000055, "input_cost_per_token_batches": 0.0000011, "output_cost_per_token_batches": 0.0000044}, "us/gpt-4.1-mini-2025-04-14" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.1-mini", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.00000044, "output_cost_per_token": 0.00000176, "cache_read_input_token_cost": 0.00000011, "input_cost_per_token_batches": 0.00000022, "output_cost_per_token_batches": 0.00000088}, "us/gpt-4.1-nano-2025-04-14" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4.1-nano", "max_input_tokens": 1047576, "max_output_tokens": 32768, "input_cost_per_token": 0.00000011, "output_cost_per_token": 0.00000044, "cache_read_input_token_cost": 0.000000025, "input_cost_per_token_batches": 0.00000006, "output_cost_per_token_batches": 0.00000022}, "us/gpt-4o-2024-08-06" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.000001375}, "us/gpt-4o-2024-11-20" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "cache_creation_input_token_cost": 0.00000138}, "us/gpt-4o-mini-2024-07-18" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-mini", "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.000000165, "output_cost_per_token": 0.00000066, "cache_read_input_token_cost": 0.000000083}, "us/gpt-4o-mini-realtime-preview-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-mini-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000066, "output_cost_per_token": 0.00000264, "input_cost_per_audio_token": 0.000011, "cache_read_input_token_cost": 0.00000033, "output_cost_per_audio_token": 0.000022, "cache_creation_input_audio_token_cost": 0.00000033}, "us/gpt-4o-realtime-preview-2024-10-01" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.000022, "input_cost_per_audio_token": 0.00011, "cache_read_input_token_cost": 0.00000275, "output_cost_per_audio_token": 0.00022, "cache_creation_input_audio_token_cost": 0.000022}, "us/gpt-4o-realtime-preview-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "gpt-4o-realtime", "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000055, "output_cost_per_token": 0.000022, "input_cost_per_audio_token": 0.000044, "cache_read_input_token_cost": 0.00000275, "output_cost_per_audio_token": 0.00008}, "us/gpt-5-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001375, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.0000001375}, "us/gpt-5-mini-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000275, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.0000000275}, "us/gpt-5-nano-2025-08-07" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5-nano", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000055, "output_cost_per_token": 0.00000044, "cache_read_input_token_cost": 0.0000000055}, "us/gpt-5.1" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000138, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000014}, "us/gpt-5.1-chat" : {"mode": "chat", "provider": "azure", "base_model": "gpt-5.1-chat", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000138, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000014}, "us/gpt-5.1-codex" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000138, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000014}, "us/gpt-5.1-codex-mini" : {"mode": "responses", "provider": "azure", "base_model": "gpt-5.1-codex-mini", "max_input_tokens": 272000, "max_output_tokens": 128000, "input_cost_per_token": 0.000000275, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.000000028}, "us/o1-2024-12-17" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000165, "output_cost_per_token": 0.000066, "cache_read_input_token_cost": 0.00000825}, "us/o1-mini-2024-09-12" : {"mode": "chat", "provider": "azure", "base_model": "o1-mini", "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.00000121, "output_cost_per_token": 0.00000484, "cache_read_input_token_cost": 0.000000605, "input_cost_per_token_batches": 0.000000605, "output_cost_per_token_batches": 0.00000242}, "us/o1-preview-2024-09-12" : {"mode": "chat", "provider": "azure", "base_model": "o1", "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.0000165, "output_cost_per_token": 0.000066, "cache_read_input_token_cost": 0.00000825}, "us/o3-2025-04-16" : {"mode": "chat", "provider": "azure", "base_model": "o3", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000022, "output_cost_per_token": 0.0000088, "cache_read_input_token_cost": 0.00000055}, "us/o3-mini-2025-01-31" : {"mode": "chat", "provider": "azure", "base_model": "o3-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00000121, "output_cost_per_token": 0.00000484, "cache_read_input_token_cost": 0.000000605, "input_cost_per_token_batches": 0.000000605, "output_cost_per_token_batches": 0.00000242}, "us/o4-mini-2025-04-16" : {"mode": "chat", "provider": "azure", "base_model": "o4-mini", "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.00000121, "output_cost_per_token": 0.00000484, "cache_read_input_token_cost": 0.00000031}, "v0-1.0-md" : {"mode": "chat", "provider": "v0", "base_model": "v0-1.0-md", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "v0-1.5-lg" : {"mode": "chat", "provider": "v0", "base_model": "v0-1.5-lg", "max_input_tokens": 512000, "max_output_tokens": 512000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075}, "v0-1.5-md" : {"mode": "chat", "provider": "v0", "base_model": "v0-1.5-md", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "veo-2.0-generate-001" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-2.0-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.35}, "veo-3.0-fast-generate-001" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-3.0-fast-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.15}, "veo-3.0-generate-001" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-3.0-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.4}, "veo-3.1-fast-generate-001" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-3.1-fast-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.15}, "veo-3.1-fast-generate-preview" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-3.1-fast-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.15}, "veo-3.1-generate-001" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-3.1-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.4}, "veo-3.1-generate-preview" : {"mode": "video_generation", "provider": "vertex", "base_model": "veo-3.1-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.4}, "veo-3.1-lite-generate-preview" : {"mode": "video_generation", "provider": "gemini", "base_model": "veo-3.1-lite-generate", "max_input_tokens": 1024, "output_cost_per_second": 0.05}, "vercel/v0-1.0-md" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "v0-1.0-md", "max_input_tokens": 128000, "max_output_tokens": 32000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "vercel/v0-1.5-md" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "v0-1.5-md", "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "vicuna" : {"mode": "completion", "provider": "ollama", "base_model": "vicuna", "max_input_tokens": 2048, "max_output_tokens": 2048, "input_cost_per_token": 0, "output_cost_per_token": 0}, "voyage-2" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-2", "max_input_tokens": 4000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "voyage-3" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-3", "max_input_tokens": 32000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0}, "voyage-3-large" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-3-large", "max_input_tokens": 32000, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0}, "voyage-3-lite" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-3-lite", "max_input_tokens": 32000, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "voyage-3.5" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-3.5", "max_input_tokens": 32000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0}, "voyage-3.5-lite" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-3.5-lite", "max_input_tokens": 32000, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0}, "voyage-code-2" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-code-2", "max_input_tokens": 16000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "voyage-code-3" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-code-3", "max_input_tokens": 32000, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0}, "voyage-context-3" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-context-3", "max_input_tokens": 120000, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0}, "voyage-finance-2" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-finance-2", "max_input_tokens": 32000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "voyage-large-2" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-large-2", "max_input_tokens": 16000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "voyage-law-2" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-law-2", "max_input_tokens": 16000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "voyage-lite-01" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-lite-01", "max_input_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "voyage-lite-02-instruct" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-lite-02-instruct", "max_input_tokens": 4000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0}, "voyage-multimodal-3" : {"mode": "embedding", "provider": "voyage", "base_model": "voyage-multimodal-3", "max_input_tokens": 32000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0}, "wan-video/wan-2.2-5b-fast" : {"mode": "video_generation", "provider": "replicate", "base_model": "wan-video/wan-2.2-5b-fast", "output_cost_per_video_per_second": 0.002}, "wan-video/wan-2.2-i2v-fast" : {"mode": "video_generation", "provider": "replicate", "base_model": "wan-video/wan-2.2-i2v-fast", "output_cost_per_video_per_second": 0.01}, "wan-video/wan-2.2-t2v-fast" : {"mode": "video_generation", "provider": "replicate", "base_model": "wan-video/wan-2.2-t2v-fast", "output_cost_per_video_per_second": 0.01}, "whisper" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "whisper", "input_cost_per_second": 0.0001, "output_cost_per_second": 0}, "whisper-1" : {"mode": "audio_transcription", "provider": "openai", "base_model": "whisper-1", "input_cost_per_second": 0.0001, "output_cost_per_second": 0.0001}, "whisper-base" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "whisper-base", "input_cost_per_second": 0.0001, "output_cost_per_second": 0}, "whisper-large" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "whisper-large", "input_cost_per_second": 0.0001, "output_cost_per_second": 0}, "whisper-large-v3" : {"mode": "audio_transcription", "provider": "groq", "base_model": "whisper-large-v3", "input_cost_per_second": 0.00003083, "output_cost_per_second": 0}, "whisper-large-v3-turbo" : {"mode": "audio_transcription", "provider": "groq", "base_model": "whisper-large-v3-turbo", "input_cost_per_second": 0.00001111, "output_cost_per_second": 0}, "whisper-medium" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "whisper-medium", "input_cost_per_second": 0.0001, "output_cost_per_second": 0}, "whisper-small" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "whisper-small", "input_cost_per_second": 0.0001, "output_cost_per_second": 0}, "whisper-tiny" : {"mode": "audio_transcription", "provider": "deepgram", "base_model": "whisper-tiny", "input_cost_per_second": 0.0001, "output_cost_per_second": 0}, "writer.palmyra-x4-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "palmyra-x4", "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001}, "writer.palmyra-x5-v1:0" : {"mode": "chat", "provider": "bedrock", "base_model": "palmyra-x5", "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000006}, "writer/palmyra-x5" : {"mode": "chat", "provider": "openrouter", "base_model": "palmyra-x5", "max_input_tokens": 1040000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000006}, "x-ai/grok-4" : {"mode": "chat", "provider": "openrouter", "base_model": "grok-4", "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "x-ai/grok-4.20" : {"mode": "chat", "provider": "openrouter", "base_model": "grok-4.20", "max_input_tokens": 2000000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.0000002}, "x-ai/grok-4.20-multi-agent" : {"mode": "chat", "provider": "openrouter", "base_model": "grok-4.20-multi-agent", "max_input_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "x-ai/grok-4.3" : {"mode": "chat", "provider": "openrouter", "base_model": "grok-4.3", "max_input_tokens": 1000000, "input_cost_per_token": 0.00000125, "output_cost_per_token": 0.0000025, "cache_read_input_token_cost": 0.0000002}, "x-ai/grok-build-0.1" : {"mode": "chat", "provider": "openrouter", "base_model": "grok-build-0.1", "max_input_tokens": 256000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.0000002}, "x-ai/grok-voice-tts-1.0" : {"mode": "chat", "provider": "openrouter", "base_model": "grok-voice-tts-1.0", "max_input_tokens": 15000, "input_cost_per_token": 0.000015}, "xai.grok-3" : {"mode": "chat", "provider": "oci", "base_model": "grok-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "xai.grok-3-fast" : {"mode": "chat", "provider": "oci", "base_model": "grok-3-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025}, "xai.grok-3-mini" : {"mode": "chat", "provider": "oci", "base_model": "grok-3-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000005}, "xai.grok-3-mini-fast" : {"mode": "chat", "provider": "oci", "base_model": "grok-3-mini-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000004}, "xai.grok-4" : {"mode": "chat", "provider": "oci", "base_model": "grok-4", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "xai.grok-4-fast" : {"mode": "chat", "provider": "oci", "base_model": "grok-4-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025}, "xai.grok-4.1-fast" : {"mode": "chat", "provider": "oci", "base_model": "grok-4.1-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025}, "xai.grok-4.20" : {"mode": "chat", "provider": "oci", "base_model": "grok-4.20", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "xai.grok-4.20-multi-agent" : {"mode": "chat", "provider": "oci", "base_model": "grok-4.20-multi-agent", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "xai.grok-code-fast-1" : {"mode": "chat", "provider": "oci", "base_model": "grok-code-fast-1", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025}, "xai/grok-2" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "grok-2", "max_input_tokens": 131072, "max_output_tokens": 4000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "xai/grok-2-vision" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "grok-2-vision", "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001}, "xai/grok-3" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "grok-3", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015}, "xai/grok-3-fast" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "grok-3-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025}, "xai/grok-3-mini" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "grok-3-mini", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000005}, "xai/grok-3-mini-fast" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "grok-3-mini-fast", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.000004}, "xai/grok-4" : {"mode": "chat", "provider": "replicate", "base_model": "grok-4", "input_cost_per_token": 0.0000072, "output_cost_per_token": 0.000036}, "xai/grok-4-1-fast-non-reasoning" : {"mode": "responses", "provider": "perplexity", "base_model": "grok-4-1-fast-non"}, "xai/grok-4.1-fast-non-reasoning" : {"mode": "chat", "provider": "vertex", "base_model": "grok-4.1-fast-non-reasoning", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.00000005, "input_cost_per_token_above_128k_tokens": 0.0000004, "output_cost_per_token_above_128k_tokens": 0.000001}, "xai/grok-4.1-fast-reasoning" : {"mode": "chat", "provider": "vertex", "base_model": "grok-4.1-fast-non-reasoning", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000005, "cache_read_input_token_cost": 0.00000005, "input_cost_per_token_above_128k_tokens": 0.0000004, "output_cost_per_token_above_128k_tokens": 0.000001}, "xai/grok-4.20-beta-0309-non-reasoning" : {"mode": "chat", "provider": "vertex", "base_model": "grok-4.20", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "xai/grok-4.20-non-reasoning" : {"mode": "chat", "provider": "vertex", "base_model": "grok-4.20-non", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "xai/grok-4.20-reasoning" : {"mode": "chat", "provider": "vertex", "base_model": "grok-4.20-reasoning", "max_input_tokens": 2000000, "max_output_tokens": 2000000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "cache_read_input_token_cost": 0.0000002}, "xai/grok-imagine-image" : {"mode": "image_generation", "provider": "replicate", "base_model": "grok-imagine-image", "output_cost_per_image": 0.02}, "xiaomi/mimo-v2-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "mimo-v2-flash", "max_input_tokens": 262144, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003, "cache_read_input_token_cost": 0.00000001, "cache_creation_input_token_cost": 0}, "xiaomi/mimo-v2.5" : {"mode": "chat", "provider": "openrouter", "base_model": "mimo", "max_input_tokens": 1048576, "max_output_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002, "cache_read_input_token_cost": 0.00000008, "cache_creation_input_token_cost": 0}, "xiaomi/mimo-v2.5-pro" : {"mode": "chat", "provider": "openrouter", "base_model": "mimo-v2.5-pro", "max_input_tokens": 1048576, "max_output_tokens": 16384, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "cache_read_input_token_cost": 0.0000002, "cache_creation_input_token_cost": 0}, "xiaomimimo/mimo-v2-flash" : {"mode": "chat", "provider": "novita", "base_model": "mimo-v2-flash", "max_input_tokens": 262144, "max_output_tokens": 32000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000003, "cache_read_input_token_cost": 0.00000002}, "z-ai/glm-4-32b" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4-32b", "max_input_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001}, "z-ai/glm-4.5" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.5", "max_input_tokens": 131072, "max_output_tokens": 98304, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.00000011}, "z-ai/glm-4.5-air" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.5-air", "max_input_tokens": 131070, "max_output_tokens": 131070, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.00000085, "cache_read_input_token_cost": 0.00000006}, "z-ai/glm-4.5v" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.5v", "max_input_tokens": 65536, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000018, "cache_read_input_token_cost": 0.00000011}, "z-ai/glm-4.6" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.6", "max_input_tokens": 202800, "max_output_tokens": 131000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.00000175, "cache_read_input_token_cost": 0.00000008}, "z-ai/glm-4.6:exacto" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.6", "max_input_tokens": 202800, "max_output_tokens": 131000, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000019}, "z-ai/glm-4.6v" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.6v", "max_input_tokens": 131072, "max_output_tokens": 24000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009, "cache_read_input_token_cost": 0.00000005}, "z-ai/glm-4.7" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.7", "max_input_tokens": 202752, "max_output_tokens": 64000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000015, "cache_read_input_token_cost": 0, "cache_creation_input_token_cost": 0}, "z-ai/glm-4.7-flash" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-4.7-flash", "max_input_tokens": 200000, "max_output_tokens": 32000, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.0000004, "cache_read_input_token_cost": 0, "cache_creation_input_token_cost": 0}, "z-ai/glm-5" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-5", "max_input_tokens": 202752, "max_output_tokens": 128000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.00000256, "cache_read_input_token_cost": 0.00000012}, "z-ai/glm-5-turbo" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-5-turbo", "max_input_tokens": 202752, "max_output_tokens": 131072, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000024}, "z-ai/glm-5.1" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-5.1", "max_input_tokens": 202752, "max_output_tokens": 131072, "input_cost_per_token": 0.00000098, "output_cost_per_token": 0.00000308, "cache_read_input_token_cost": 0.000000182}, "z-ai/glm-5v-turbo" : {"mode": "chat", "provider": "openrouter", "base_model": "glm-5v-turbo", "max_input_tokens": 202752, "max_output_tokens": 131072, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.000004, "cache_read_input_token_cost": 0.00000024}, "zai-glm-4.6" : {"mode": "chat", "provider": "cerebras", "base_model": "glm-4.6", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000225, "output_cost_per_token": 0.00000275}, "zai-glm-4.7" : {"mode": "chat", "provider": "cerebras", "base_model": "glm-4.7", "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000225, "output_cost_per_token": 0.00000275}, "zai-org/GLM-4.5" : {"mode": "chat", "provider": "deepinfra", "base_model": "glm-4.5", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000016}, "zai-org/GLM-4.5-Air-FP8" : {"mode": "chat", "provider": "together_ai", "base_model": "glm-4.5-air-fp8", "max_input_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000011}, "zai-org/GLM-4.6" : {"mode": "chat", "provider": "together_ai", "base_model": "glm-4.6", "max_input_tokens": 200000, "max_output_tokens": 200000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022}, "zai-org/GLM-4.7" : {"mode": "chat", "provider": "baseten", "base_model": "glm-4.7", "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022}, "zai-org/GLM-4.7-FP8" : {"mode": "chat", "provider": "gmi", "base_model": "glm-4.7-fp8", "max_input_tokens": 202752, "max_output_tokens": 16384, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.000002}, "zai-org/GLM-5" : {"mode": "chat", "provider": "baseten", "base_model": "glm-5", "input_cost_per_token": 0.00000095, "output_cost_per_token": 0.00000315}, "zai-org/autoglm-phone-9b-multilingual" : {"mode": "chat", "provider": "novita", "base_model": "autoglm-phone-9b-multilingual", "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.000000138}, "zai-org/glm-4.5" : {"mode": "chat", "provider": "novita", "base_model": "glm-4.5", "max_input_tokens": 131072, "max_output_tokens": 98304, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.00000011}, "zai-org/glm-4.5-air" : {"mode": "chat", "provider": "novita", "base_model": "glm-4.5-air", "max_input_tokens": 131072, "max_output_tokens": 98304, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000085}, "zai-org/glm-4.5v" : {"mode": "chat", "provider": "novita", "base_model": "glm-4.5v", "max_input_tokens": 65536, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000018, "cache_read_input_token_cost": 0.00000011}, "zai-org/glm-4.6" : {"mode": "chat", "provider": "novita", "base_model": "glm-4.6", "max_input_tokens": 204800, "max_output_tokens": 131072, "input_cost_per_token": 0.00000055, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.00000011}, "zai-org/glm-4.6v" : {"mode": "chat", "provider": "novita", "base_model": "glm-4.6v", "max_input_tokens": 131072, "max_output_tokens": 32768, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000009, "cache_read_input_token_cost": 0.000000055}, "zai-org/glm-4.7" : {"mode": "chat", "provider": "novita", "base_model": "glm-4.7", "max_input_tokens": 204800, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022, "cache_read_input_token_cost": 0.00000011}, "zai-org/glm-4.7-maas" : {"mode": "chat", "provider": "vertex", "base_model": "glm-4.7", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022}, "zai-org/glm-5-maas" : {"mode": "chat", "provider": "vertex", "base_model": "glm-5", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.0000032, "cache_read_input_token_cost": 0.0000001}, "zai.glm-4.7" : {"mode": "chat", "provider": "bedrock", "base_model": "zai.glm-4.7", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022}, "zai.glm-4.7-flash" : {"mode": "chat", "provider": "bedrock", "base_model": "zai.glm-4.7-flash", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.0000004}, "zai.glm-5" : {"mode": "chat", "provider": "bedrock", "base_model": "zai.glm-5", "max_input_tokens": 200000, "max_output_tokens": 128000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.0000032}, "zai/glm-4.5" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "glm-4.5", "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000022}, "zai/glm-4.5-air" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "glm-4.5-air", "max_input_tokens": 128000, "max_output_tokens": 96000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000011}, "zai/glm-4.6" : {"mode": "chat", "provider": "vercel_ai_gateway", "base_model": "glm-4.6", "max_input_tokens": 200000, "max_output_tokens": 200000, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000018, "cache_read_input_token_cost": 0.00000011}, "zyphra/zonos-v0.1-hybrid" : {"mode": "chat", "provider": "openrouter", "base_model": "zonos-v0.1-hybrid", "max_input_tokens": 4096, "input_cost_per_token": 0.000007}, "zyphra/zonos-v0.1-transformer" : {"mode": "chat", "provider": "openrouter", "base_model": "zonos-v0.1-transformer", "max_input_tokens": 4096, "input_cost_per_token": 0.000007}, "~anthropic/claude-haiku-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-haiku-latest", "max_input_tokens": 200000, "max_output_tokens": 64000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_read_input_token_cost": 0.0000001, "cache_creation_input_token_cost": 0.00000125}, "~anthropic/claude-opus-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-opus-latest", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000025, "cache_read_input_token_cost": 0.0000005, "cache_creation_input_token_cost": 0.00000625}, "~anthropic/claude-sonnet-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "claude-sonnet-latest", "max_input_tokens": 1000000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_token_cost": 0.00000375}, "~google/gemini-flash-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-flash-latest", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.0000015, "output_cost_per_image": 0.0000015, "output_cost_per_token": 0.000009, "cache_read_input_token_cost": 0.00000015, "cache_creation_input_token_cost": 0.00000008333333333333334}, "~google/gemini-pro-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "gemini-pro-latest", "max_input_tokens": 1048576, "max_output_tokens": 65536, "input_cost_per_token": 0.000002, "output_cost_per_image": 0.000002, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000002, "cache_creation_input_token_cost": 0.000000375}, "~moonshotai/kimi-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "kimi-latest", "max_input_tokens": 262144, "max_output_tokens": 262144, "input_cost_per_token": 0.000000684, "output_cost_per_token": 0.00000342, "cache_read_input_token_cost": 0.000000144}, "~openai/gpt-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-latest", "max_input_tokens": 1050000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.00003, "cache_read_input_token_cost": 0.0000005}, "~openai/gpt-mini-latest" : {"mode": "chat", "provider": "openrouter", "base_model": "gpt-mini-latest", "max_input_tokens": 400000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.0000045, "cache_read_input_token_cost": 0.000000075} }
