{"models":[{"model_id":"dos-auto","display_name":"DOS.AI Auto","provider":"dos-ai","input_price_per_million":0,"output_price_per_million":0,"context_length":131072,"description":"Smart routing - automatically picks the best model for your request. Free for simple tasks, paid models for complex ones.","capabilities":{}},{"model_id":"dos-ai","display_name":"DOS.AI","provider":"dos-ai","input_price_per_million":1,"output_price_per_million":1,"context_length":131072,"description":"Ultra-efficient MoE model — 35B total, 3B active parameters. Fast inference at near-8B cost with 70B-class quality.","capabilities":{"category":"chat","is_featured":true,"is_new":true,"parameters":"35B MoE (3B active)","streaming":true,"tools":true}},{"model_id":"deepseek-v3","display_name":"DeepSeek V3","provider":"deepseek","input_price_per_million":16,"output_price_per_million":31,"context_length":65536,"description":"DeepSeek V3 — frontier open model. Excellent reasoning and coding.","capabilities":{"category":"chat","is_featured":true,"is_new":true,"parameters":"671B MoE","streaming":true,"tools":true}},{"model_id":"qwen3.5-27b","display_name":"Qwen 3.5 27B","provider":"alibaba","input_price_per_million":33,"output_price_per_million":264,"context_length":262144,"description":"Efficient dense model for everyday tasks — fast inference with competitive quality.","capabilities":{"category":"chat","is_new":true,"parameters":"27B"}},{"model_id":"llama-4-scout","display_name":"Llama 4 Scout 17B-16E","provider":"deepinfra","input_price_per_million":11,"output_price_per_million":38,"context_length":655360,"description":"Meta Llama 4 Scout — 17B active params, 16 experts MoE. Fast and efficient for everyday tasks.","capabilities":{"category":"chat","is_new":true,"parameters":"17B-16E MoE"}},{"model_id":"qwen3.5-122b-a10b","display_name":"Qwen 3.5 122B-A10B","provider":"alibaba","input_price_per_million":44,"output_price_per_million":352,"context_length":262144,"description":"High-capability MoE model — 122B total, 10B active. Strong balance of performance and cost.","capabilities":{"category":"chat","is_new":true,"parameters":"122B MoE (10B active)"}},{"model_id":"llama-4-maverick","display_name":"Llama 4 Maverick 17B-128E","provider":"deepinfra","input_price_per_million":17,"output_price_per_million":66,"context_length":1048576,"description":"Meta Llama 4 Maverick — 17B active params, 128 experts MoE. Strong reasoning and multilingual.","capabilities":{"category":"chat","is_featured":true,"is_new":true,"parameters":"17B-128E MoE"}},{"model_id":"qwen3.5-397b-a17b","display_name":"Qwen 3.5 397B-A17B","provider":"alibaba","input_price_per_million":66,"output_price_per_million":396,"context_length":262144,"description":"Flagship open-source MoE model — 397B total, 17B active parameters. Top-tier reasoning and coding.","capabilities":{"category":"chat","is_featured":true,"is_new":true,"parameters":"397B MoE (17B active)"}},{"model_id":"wan2.7-t2v","display_name":"Wan 2.7 Text-to-Video","provider":"alibaba","input_price_per_million":10000,"output_price_per_million":0,"description":"Video generation from text prompt via Alibaba Wan 2.7. Duration 2-15s, 1080P, native audio. Pricing: per 1000 seconds.","capabilities":{}},{"model_id":"wan2.7-i2v","display_name":"Wan 2.7 Image-to-Video","provider":"alibaba","input_price_per_million":10000,"output_price_per_million":0,"description":"Video generation from image + text prompt via Alibaba Wan 2.7. Pricing: per 1000 seconds.","capabilities":{}},{"model_id":"minimax-music-2.5","display_name":"MiniMax Music 2.5+","provider":"minimax","input_price_per_million":5000,"output_price_per_million":0,"description":"Music generation with vocals or instrumental. ~3 min per track. Price: per 1000 seconds of audio.","capabilities":{}},{"model_id":"claude-sonnet-4.6","display_name":"Claude Sonnet 4.6","provider":"anthropic","input_price_per_million":315,"output_price_per_million":1575,"context_length":200000,"description":"Fast, intelligent model for everyday tasks","capabilities":{"category":"chat","vision":true}},{"model_id":"claude-haiku-4.5","display_name":"Claude Haiku 4.5","provider":"anthropic","input_price_per_million":105,"output_price_per_million":525,"context_length":200000,"description":"Fastest and most compact Claude model","capabilities":{"category":"chat","vision":true}},{"model_id":"claude-opus-4.6","display_name":"Claude Opus 4.6","provider":"anthropic","input_price_per_million":525,"output_price_per_million":2625,"context_length":200000,"description":"Most powerful Claude model for complex tasks","capabilities":{"category":"chat","vision":true}},{"model_id":"gpt-5.4","display_name":"GPT-5.4","provider":"openai","input_price_per_million":263,"output_price_per_million":1575,"context_length":1000000,"description":"Most capable GPT model for agentic, coding, and professional workflows","capabilities":{"category":"chat","vision":true}},{"model_id":"gpt-5.4-mini","display_name":"GPT-5.4 Mini","provider":"openai","input_price_per_million":79,"output_price_per_million":473,"context_length":400000,"description":"Strong mini model for coding, computer use, and sub-agents","capabilities":{"category":"chat","vision":true}},{"model_id":"gpt-5.4-nano","display_name":"GPT-5.4 Nano","provider":"openai","input_price_per_million":21,"output_price_per_million":131,"context_length":400000,"description":"Cheapest GPT-5.4-class model for simple high-volume tasks","capabilities":{"category":"chat","vision":true}},{"model_id":"gemini-3.1-pro","display_name":"Gemini 3.1 Pro","provider":"google","input_price_per_million":210,"output_price_per_million":1260,"context_length":1000000,"description":"Google's most advanced reasoning model for complex tasks","capabilities":{"category":"chat","vision":true}},{"model_id":"gemini-3-flash","display_name":"Gemini 3 Flash","provider":"google","input_price_per_million":53,"output_price_per_million":315,"context_length":1000000,"description":"Frontier-class performance at reduced cost","capabilities":{"category":"chat","vision":true}},{"model_id":"gemini-3.1-flash-lite","display_name":"Gemini 3.1 Flash-Lite","provider":"google","input_price_per_million":26,"output_price_per_million":158,"context_length":1000000,"description":"Fastest and most cost-efficient Gemini 3 model","capabilities":{"category":"chat","vision":true}},{"model_id":"gemini-3.1-flash-live","display_name":"Gemini 3.1 Flash Live","provider":"google","input_price_per_million":79,"output_price_per_million":473,"context_length":1000000,"description":"Real-time voice and dialogue model","capabilities":{"category":"chat","vision":true}},{"model_id":"grok-4.20","display_name":"Grok 4.20","provider":"xai","input_price_per_million":210,"output_price_per_million":630,"context_length":2000000,"description":"xAI flagship reasoning model with 2M context","capabilities":{"category":"chat","reasoning":true,"vision":true}},{"model_id":"grok-4.1-fast","display_name":"Grok 4.1 Fast","provider":"xai","input_price_per_million":21,"output_price_per_million":53,"context_length":2000000,"description":"Near-frontier performance at budget pricing with 2M context","capabilities":{"category":"chat","reasoning":true,"vision":true}}]}