{ "data": [ { "id": "zai-org/GLM-4.5", "object": "model", "created": 1752981936, "owned_by": "zai-org", "providers": [ { "provider": "novita", "status": "live", "pricing": { "input": 60, "output": 220 }, "context_length": 131072, "supports_tools": true, "supports_structured_output": true, "supports_response_format": true, "supports_function_calling": true, "latency_s": 5.95, "throughput_tps": 48.9, "performance_tested_at": "2025-08-04T09:02:05.950Z" } ] }, { "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "object": "model", "created": 1753195958, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 262144, "pricing": { "input": 0.95, "output": 5 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 1.47, "throughput_tps": 21.09, "performance_tested_at": "2025-08-04T09:02:01.469Z" }, { "provider": "cerebras", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 4.5, "throughput_tps": 7.77, "performance_tested_at": "2025-08-04T09:02:04.503Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.7, "throughput_tps": 48.7, "performance_tested_at": "2025-08-04T09:02:00.698Z" }, { "provider": "together", "status": "live", "context_length": 262144, "pricing": { "input": 2, "output": 2 }, "supports_tools": false, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 10, "throughput_tps": 3.4, "performance_tested_at": "2025-08-04T09:02:09.996Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 3.2, "throughput_tps": 10.64, "performance_tested_at": "2025-08-04T09:02:03.196Z" } ] }, { "id": "moonshotai/Kimi-K2-Instruct", "object": "model", "created": 1752195312, "owned_by": "moonshotai", "providers": [ { "provider": "novita", "status": "live", "pricing": { "input": 57, "output": 230 }, "context_length": 131072, "supports_tools": true, "supports_structured_output": true, "supports_function_calling": true, "supports_response_format": true, "latency_s": 1.06, "throughput_tps": 28.42, "performance_tested_at": "2025-08-04T09:02:01.055Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 1.07, "throughput_tps": 37.37, "performance_tested_at": "2025-08-04T09:02:01.070Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "HTTP 400 Bad Request", "performance_tested_at": "2025-08-04T09:02:02.113Z" }, { "provider": "groq", "status": "live", "context_length": 131072, "latency_s": 0.37, "throughput_tps": 131.18, "performance_tested_at": "2025-08-04T09:02:00.366Z" } ] }, { "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", "object": "model", "created": 1753419545, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 131072, "pricing": { "input": 0.3, "output": 3 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 6.76, "throughput_tps": 78.85, "performance_tested_at": "2025-08-04T09:02:06.760Z" }, { "provider": "cerebras", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 0.96, "throughput_tps": 355.8, "performance_tested_at": "2025-08-04T09:02:00.955Z" } ] }, { "id": "CohereLabs/command-a-vision-07-2025", "object": "model", "created": 1753689307, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 1.69, "throughput_tps": 44.37, "performance_tested_at": "2025-08-04T09:02:01.690Z" } ] }, { "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", "object": "model", "created": 1753080416, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 262144, "pricing": { "input": 0.15, "output": 0.8 }, "supports_tools": true, "supports_structured_output": true, "supports_response_format": true, "supports_function_calling": true, "latency_s": 0.77, "throughput_tps": 44.37, "performance_tested_at": "2025-08-04T09:02:00.766Z" }, { "provider": "nebius", "status": "offline", "supports_tools": true, "supports_structured_output": true, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:02:30.001Z" }, { "provider": "cerebras", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.49, "throughput_tps": 70.83, "performance_tested_at": "2025-08-04T09:02:00.494Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.79, "throughput_tps": 43.05, "performance_tested_at": "2025-08-04T09:02:00.789Z" }, { "provider": "together", "status": "live", "context_length": 262144, "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 0.67, "throughput_tps": 48.91, "performance_tested_at": "2025-08-04T09:02:00.674Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 1.75, "throughput_tps": 20, "performance_tested_at": "2025-08-04T09:02:01.750Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 0.75, "throughput_tps": 42.6, "performance_tested_at": "2025-08-04T09:02:00.751Z" } ] }, { "id": "meta-llama/Llama-3.1-8B-Instruct", "object": "model", "created": 1721292960, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 16384, "pricing": { "input": 0.02, "output": 0.05 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.81, "throughput_tps": 72.84, "performance_tested_at": "2025-08-04T09:02:31.814Z" }, { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.03, "output": 0.09 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.44, "throughput_tps": 72.65, "performance_tested_at": "2025-08-04T09:02:31.445Z" }, { "provider": "cerebras", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.46, "throughput_tps": 127.5, "performance_tested_at": "2025-08-04T09:02:31.467Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": false, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.38, "throughput_tps": 86.94, "performance_tested_at": "2025-08-04T09:02:31.384Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 7.23, "throughput_tps": 3.87, "performance_tested_at": "2025-08-04T09:02:38.233Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 1.39, "throughput_tps": 23.76, "performance_tested_at": "2025-08-04T09:02:32.395Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 0.7, "throughput_tps": 82.27, "performance_tested_at": "2025-08-04T09:02:31.711Z" }, { "provider": "sambanova", "status": "live", "context_length": 16384, "pricing": { "input": 0.1, "output": 0.2 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.53, "throughput_tps": 107.02, "performance_tested_at": "2025-08-04T09:02:31.539Z" } ] }, { "id": "zai-org/GLM-4.5-Air-FP8", "object": "model", "created": 1752982200, "owned_by": "zai-org", "providers": [ { "provider": "together", "status": "live", "supports_tools": false, "supports_structured_output": true, "pricing": { "input": 65, "output": 0 }, "context_length": 32768, "supports_stop_sequences": true, "latency_s": 2.67, "throughput_tps": 99.6, "performance_tested_at": "2025-08-04T09:02:33.677Z" } ] }, { "id": "HuggingFaceTB/SmolLM3-3B", "object": "model", "created": 1751969505, "owned_by": "HuggingFaceTB", "providers": [ { "provider": "hf-inference", "status": "offline", "supports_tools": true, "supports_structured_output": true, "performance_error": "HTTP 404 Not Found", "performance_tested_at": "2025-08-04T09:02:31.217Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1", "object": "model", "created": 1737344767, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 64000, "pricing": { "input": 0.7, "output": 2.5 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 6.51, "throughput_tps": 23.35, "performance_tested_at": "2025-08-04T09:02:37.516Z" }, { "provider": "nebius", "status": "live", "context_length": 163840, "pricing": { "input": 2, "output": 6 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 3.92, "throughput_tps": 71.42, "performance_tested_at": "2025-08-04T09:02:34.927Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": false, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 3.73, "throughput_tps": 70.06, "performance_tested_at": "2025-08-04T09:02:34.732Z" }, { "provider": "together", "status": "offline", "context_length": 163840, "pricing": { "input": 3, "output": 7 }, "supports_tools": false, "supports_structured_output": true, "supports_stop_sequences": true, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:03:01.007Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 3.35, "throughput_tps": 56.99, "performance_tested_at": "2025-08-04T09:02:34.358Z" }, { "provider": "sambanova", "status": "live", "supports_tools": false, "supports_structured_output": false, "pricing": { "input": 5, "output": 7 }, "context_length": 32768, "latency_s": 14.05, "throughput_tps": 118.05, "performance_tested_at": "2025-08-04T09:02:45.120Z" } ] }, { "id": "Qwen/Qwen3-30B-A3B", "object": "model", "created": 1745725385, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 40960, "pricing": { "input": 0.1, "output": 0.45 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 24.67, "throughput_tps": 12.36, "performance_tested_at": "2025-08-04T09:02:55.679Z" }, { "provider": "nebius", "status": "live", "context_length": 40960, "pricing": { "input": 0.3, "output": 0.9 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 2.38, "throughput_tps": 124.51, "performance_tested_at": "2025-08-04T09:02:33.384Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 2, "throughput_tps": 111.18, "performance_tested_at": "2025-08-04T09:02:33.003Z" } ] }, { "id": "Qwen/Qwen3-8B", "object": "model", "created": 1745725341, "owned_by": "Qwen", "providers": [ { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 9.66, "throughput_tps": 18.84, "performance_tested_at": "2025-08-04T09:02:40.667Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 3.77, "throughput_tps": 62.78, "performance_tested_at": "2025-08-04T09:03:05.784Z" } ] }, { "id": "google/gemma-3-27b-it", "object": "model", "created": 1740856219, "owned_by": "google", "providers": [ { "provider": "nebius", "status": "live", "context_length": 110000, "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.46, "throughput_tps": 75.3, "performance_tested_at": "2025-08-04T09:03:02.474Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 16.71, "throughput_tps": 3.83, "performance_tested_at": "2025-08-04T09:03:18.719Z" } ] }, { "id": "zai-org/GLM-4.1V-9B-Thinking", "object": "model", "created": 1751120650, "owned_by": "zai-org", "providers": [ { "provider": "novita", "status": "live", "context_length": 65536, "pricing": { "input": 0.035, "output": 0.138 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 1.31, "throughput_tps": 70.18, "performance_tested_at": "2025-08-04T09:03:03.320Z" } ] }, { "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", "object": "model", "created": 1753197829, "owned_by": "Qwen", "providers": [ { "provider": "together", "status": "live", "context_length": 262144, "pricing": { "input": 2, "output": 2 }, "supports_tools": false, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 1.1, "throughput_tps": 31.9, "performance_tested_at": "2025-08-04T09:03:03.107Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-0528", "object": "model", "created": 1748425602, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "pricing": { "input": 70, "output": 250 }, "context_length": 163840, "supports_tools": true, "supports_structured_output": true, "supports_function_calling": true, "supports_response_format": true, "latency_s": 17.97, "throughput_tps": 26.27, "performance_tested_at": "2025-08-04T09:03:19.977Z" }, { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.8, "output": 2.4 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 11.03, "throughput_tps": 28.74, "performance_tested_at": "2025-08-04T09:03:13.038Z" }, { "provider": "fireworks-ai", "status": "live", "context_length": 163840, "supports_tools": false, "supports_image_input": false, "supports_function_calling": false, "latency_s": 1.03, "throughput_tps": 82.88, "performance_tested_at": "2025-08-04T09:03:03.035Z" }, { "provider": "together", "status": "live", "pricing": { "input": 65, "output": 0 }, "context_length": 32768, "supports_stop_sequences": true, "latency_s": 4.66, "throughput_tps": 30.7, "performance_tested_at": "2025-08-04T09:03:06.668Z" }, { "provider": "hyperbolic", "status": "live", "latency_s": 3.11, "throughput_tps": 75.29, "performance_tested_at": "2025-08-04T09:03:05.118Z" }, { "provider": "sambanova", "status": "live", "pricing": { "input": 5, "output": 7 }, "context_length": 32768, "latency_s": 17.96, "throughput_tps": 126.51, "performance_tested_at": "2025-08-04T09:03:19.977Z" } ] }, { "id": "Qwen/Qwen2.5-VL-7B-Instruct", "object": "model", "created": 1737883597, "owned_by": "Qwen", "providers": [ { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 0.59, "throughput_tps": 77.4, "performance_tested_at": "2025-08-04T09:03:02.604Z" } ] }, { "id": "meta-llama/Meta-Llama-3-8B-Instruct", "object": "model", "created": 1713346512, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 8192, "pricing": { "input": 0.04, "output": 0.04 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.97, "throughput_tps": 59.51, "performance_tested_at": "2025-08-04T09:03:02.984Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 4.55, "throughput_tps": 6.6, "performance_tested_at": "2025-08-04T09:03:06.556Z" }, { "provider": "groq", "status": "live", "context_length": 8192, "pricing": { "input": 0.05, "output": 0.08 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.51, "throughput_tps": 71.01, "performance_tested_at": "2025-08-04T09:03:02.517Z" } ] }, { "id": "meta-llama/Llama-3.2-3B-Instruct", "object": "model", "created": 1726672760, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 32768, "pricing": { "input": 0.03, "output": 0.05 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 0.9, "throughput_tps": 63.17, "performance_tested_at": "2025-08-04T09:03:02.912Z" }, { "provider": "together", "status": "offline", "context_length": 131072, "pricing": { "input": 0.060000000000000005, "output": 0.060000000000000005 }, "supports_tools": false, "supports_structured_output": false, "supports_stop_sequences": true, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:03:32.011Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 1.08, "throughput_tps": 46.38, "performance_tested_at": "2025-08-04T09:03:03.087Z" } ] }, { "id": "Qwen/Qwen3-32B", "object": "model", "created": 1745725979, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 40960, "pricing": { "input": 0.1, "output": 0.45 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 14.2, "throughput_tps": 43.94, "performance_tested_at": "2025-08-04T09:03:16.210Z" }, { "provider": "nebius", "status": "live", "context_length": 40960, "pricing": { "input": 0.1, "output": 0.3 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 11.13, "throughput_tps": 32.16, "performance_tested_at": "2025-08-04T09:03:13.142Z" }, { "provider": "cerebras", "status": "live", "pricing": { "input": 0.4, "output": 0.8 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.48, "throughput_tps": 368.47, "performance_tested_at": "2025-08-04T09:03:33.490Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:04:03.013Z" }, { "provider": "groq", "status": "live", "context_length": 131072, "pricing": { "input": 0.29, "output": 0.59 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 1.25, "throughput_tps": 186.18, "performance_tested_at": "2025-08-04T09:03:34.264Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 10.08, "throughput_tps": 28.57, "performance_tested_at": "2025-08-04T09:03:43.093Z" }, { "provider": "sambanova", "status": "live", "context_length": 32768, "pricing": { "input": 0.4, "output": 0.8 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 1.97, "throughput_tps": 261.95, "performance_tested_at": "2025-08-04T09:03:34.991Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "object": "model", "created": 1748516867, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 128000, "pricing": { "input": 0.06, "output": 0.09 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 6.38, "throughput_tps": 85.84, "performance_tested_at": "2025-08-04T09:03:39.396Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 9.96, "throughput_tps": 0, "performance_tested_at": "2025-08-04T09:03:42.973Z" } ] }, { "id": "deepseek-ai/DeepSeek-V3-0324", "object": "model", "created": 1742808502, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 163840, "pricing": { "input": 0.28, "output": 1.14 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 2.15, "throughput_tps": 19.11, "performance_tested_at": "2025-08-04T09:03:35.158Z" }, { "provider": "nebius", "status": "live", "context_length": 163840, "pricing": { "input": 2, "output": 6 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.88, "throughput_tps": 48.6, "performance_tested_at": "2025-08-04T09:03:33.897Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 1.41, "throughput_tps": 49.77, "performance_tested_at": "2025-08-04T09:03:34.419Z" }, { "provider": "together", "status": "live", "context_length": 131072, "pricing": { "input": 1.25, "output": 1.25 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 1.37, "throughput_tps": 29.89, "performance_tested_at": "2025-08-04T09:03:34.385Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 1.5, "throughput_tps": 27.37, "performance_tested_at": "2025-08-04T09:03:34.510Z" }, { "provider": "sambanova", "status": "live", "context_length": 32768, "pricing": { "input": 3, "output": 4.5 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 1.06, "throughput_tps": 34.89, "performance_tested_at": "2025-08-04T09:03:34.073Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", "object": "model", "created": 1737363858, "owned_by": "deepseek-ai", "providers": [ { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 27.68, "throughput_tps": 26.92, "performance_tested_at": "2025-08-04T09:04:00.688Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 3.39, "throughput_tps": 169.05, "performance_tested_at": "2025-08-04T09:03:36.402Z" } ] }, { "id": "meta-llama/Llama-3.3-70B-Instruct", "object": "model", "created": 1732637327, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 131072, "pricing": { "input": 0.13, "output": 0.39 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 0.61, "throughput_tps": 96.29, "performance_tested_at": "2025-08-04T09:03:33.625Z" }, { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.25, "output": 0.75 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.45, "throughput_tps": 128.36, "performance_tested_at": "2025-08-04T09:03:33.464Z" }, { "provider": "cerebras", "status": "live", "pricing": { "input": 0.85, "output": 1.2 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 15.09, "throughput_tps": 3.91, "performance_tested_at": "2025-08-04T09:03:48.106Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": false, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.66, "throughput_tps": 86.78, "performance_tested_at": "2025-08-04T09:03:33.669Z" }, { "provider": "together", "status": "live", "context_length": 131072, "pricing": { "input": 0.88, "output": 0.88 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 0.56, "throughput_tps": 103.62, "performance_tested_at": "2025-08-04T09:03:33.572Z" }, { "provider": "groq", "status": "live", "context_length": 131072, "pricing": { "input": 0.59, "output": 0.79 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.3, "throughput_tps": 195.82, "performance_tested_at": "2025-08-04T09:04:04.311Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 1.19, "throughput_tps": 29.32, "performance_tested_at": "2025-08-04T09:04:05.208Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 1.04, "throughput_tps": 58.74, "performance_tested_at": "2025-08-04T09:04:05.053Z" }, { "provider": "sambanova", "status": "live", "context_length": 131072, "pricing": { "input": 0.6, "output": 1.2 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.47, "throughput_tps": 128.28, "performance_tested_at": "2025-08-04T09:04:04.482Z" } ] }, { "id": "google/gemma-2-2b-it", "object": "model", "created": 1721127099, "owned_by": "google", "providers": [ { "provider": "nebius", "status": "live", "context_length": 8192, "pricing": { "input": 0.02, "output": 0.06 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.38, "throughput_tps": 107.92, "performance_tested_at": "2025-08-04T09:04:04.394Z" } ] }, { "id": "zai-org/GLM-4-32B-0414", "object": "model", "created": 1744030421, "owned_by": "zai-org", "providers": [ { "provider": "novita", "status": "live", "context_length": 32000, "pricing": { "input": 0.24, "output": 0.24 }, "supports_tools": false, "supports_structured_output": true, "supports_function_calling": true, "supports_response_format": true, "latency_s": 1.09, "throughput_tps": 27.53, "performance_tested_at": "2025-08-04T09:04:05.104Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "HTTP 503 Service Temporarily Unavailable", "performance_tested_at": "2025-08-04T09:04:18.588Z" } ] }, { "id": "Qwen/Qwen3-4B", "object": "model", "created": 1745725289, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 40960, "pricing": { "input": 0.08, "output": 0.24 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 1.3, "throughput_tps": 135.55, "performance_tested_at": "2025-08-04T09:04:05.313Z" } ] }, { "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", "object": "model", "created": 1743600857, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 131072, "pricing": { "input": 0.1, "output": 0.5 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 0.81, "throughput_tps": 40.59, "performance_tested_at": "2025-08-04T09:04:04.828Z" }, { "provider": "cerebras", "status": "live", "pricing": { "input": 0.65, "output": 0.85 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.4, "throughput_tps": 88.53, "performance_tested_at": "2025-08-04T09:04:04.410Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.61, "throughput_tps": 52.16, "performance_tested_at": "2025-08-04T09:04:04.628Z" }, { "provider": "together", "status": "live", "context_length": 1048576, "pricing": { "input": 0.18000000000000002, "output": 0.5900000000000001 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 0.34, "throughput_tps": 95.75, "performance_tested_at": "2025-08-04T09:04:04.359Z" }, { "provider": "groq", "status": "live", "context_length": 131072, "pricing": { "input": 0.11, "output": 0.34 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.26, "throughput_tps": 132.65, "performance_tested_at": "2025-08-04T09:04:04.271Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 0.61, "throughput_tps": 56.17, "performance_tested_at": "2025-08-04T09:04:04.620Z" } ] }, { "id": "meta-llama/Llama-3.2-1B-Instruct", "object": "model", "created": 1726672367, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 131000, "supports_tools": false, "supports_structured_output": false, "pricing": { "input": 0, "output": 0 }, "latency_s": 1.85, "throughput_tps": 39.99, "performance_tested_at": "2025-08-04T09:04:05.865Z" } ] }, { "id": "Qwen/Qwen2.5-7B-Instruct", "object": "model", "created": 1726487740, "owned_by": "Qwen", "providers": [ { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 4.79, "throughput_tps": 5.84, "performance_tested_at": "2025-08-04T09:04:08.809Z" }, { "provider": "together", "status": "live", "context_length": 32768, "pricing": { "input": 0.3, "output": 0.3 }, "supports_tools": true, "supports_structured_output": false, "supports_stop_sequences": true, "latency_s": 0.41, "throughput_tps": 136.18, "performance_tested_at": "2025-08-04T09:04:04.426Z" } ] }, { "id": "Qwen/Qwen3-14B", "object": "model", "created": 1745725365, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 40960, "pricing": { "input": 0.08, "output": 0.24 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 10.15, "throughput_tps": 68.28, "performance_tested_at": "2025-08-04T09:04:14.164Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "HTTP 503 Service Temporarily Unavailable", "performance_tested_at": "2025-08-04T09:04:19.084Z" } ] }, { "id": "baidu/ERNIE-4.5-21B-A3B-PT", "object": "model", "created": 1751091210, "owned_by": "baidu", "providers": [ { "provider": "novita", "status": "live", "context_length": 120000, "pricing": { "input": 0.07, "output": 0.28 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 1.31, "throughput_tps": 27.4, "performance_tested_at": "2025-08-04T09:04:05.328Z" } ] }, { "id": "meta-llama/Llama-3.1-70B-Instruct", "object": "model", "created": 1721146066, "owned_by": "meta-llama", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.13, "output": 0.4 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.58, "throughput_tps": 54.96, "performance_tested_at": "2025-08-04T09:04:20.668Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.78, "throughput_tps": 47.23, "performance_tested_at": "2025-08-04T09:04:20.869Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 1.18, "throughput_tps": 28.87, "performance_tested_at": "2025-08-04T09:04:21.263Z" } ] }, { "id": "baidu/ERNIE-4.5-VL-28B-A3B-PT", "object": "model", "created": 1751089833, "owned_by": "baidu", "providers": [ { "provider": "novita", "status": "live", "context_length": 30000, "pricing": { "input": 0.14, "output": 0.56 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 1.08, "throughput_tps": 36.93, "performance_tested_at": "2025-08-04T09:04:21.169Z" } ] }, { "id": "Qwen/Qwen2.5-Coder-32B-Instruct", "object": "model", "created": 1730879390, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.1, "output": 0.3 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 1.05, "throughput_tps": 53.37, "performance_tested_at": "2025-08-04T09:04:21.135Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 6.82, "throughput_tps": 4.1, "performance_tested_at": "2025-08-04T09:04:26.911Z" }, { "provider": "together", "status": "live", "context_length": 16384, "pricing": { "input": 0.8, "output": 0.8 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 0.45, "throughput_tps": 121.89, "performance_tested_at": "2025-08-04T09:04:20.537Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 1.09, "throughput_tps": 32.12, "performance_tested_at": "2025-08-04T09:04:21.175Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 0.91, "throughput_tps": 60.36, "performance_tested_at": "2025-08-04T09:04:20.997Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "object": "model", "created": 1737364574, "owned_by": "deepseek-ai", "providers": [ { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:04:50.087Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 4.11, "throughput_tps": 73.52, "performance_tested_at": "2025-08-04T09:04:24.193Z" } ] }, { "id": "google/gemma-2-9b-it", "object": "model", "created": 1719216341, "owned_by": "google", "providers": [ { "provider": "nebius", "status": "live", "context_length": 8192, "pricing": { "input": 0.03, "output": 0.09 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.98, "throughput_tps": 41.96, "performance_tested_at": "2025-08-04T09:04:21.063Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 7.92, "throughput_tps": 3.91, "performance_tested_at": "2025-08-04T09:04:28.009Z" }, { "provider": "groq", "status": "live", "context_length": 8192, "pricing": { "input": 0.2, "output": 0.2 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.4, "throughput_tps": 92.08, "performance_tested_at": "2025-08-04T09:04:20.488Z" } ] }, { "id": "deepseek-ai/DeepSeek-V3", "object": "model", "created": 1735131143, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 64000, "pricing": { "input": 0.4, "output": 1.3 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 1.69, "throughput_tps": 23.1, "performance_tested_at": "2025-08-04T09:04:21.774Z" }, { "provider": "nebius", "status": "live", "context_length": 163840, "pricing": { "input": 0.5, "output": 1.5 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.62, "throughput_tps": 46.9, "performance_tested_at": "2025-08-04T09:04:20.704Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.74, "throughput_tps": 79.62, "performance_tested_at": "2025-08-04T09:04:20.827Z" }, { "provider": "together", "status": "live", "context_length": 131072, "pricing": { "input": 1.25, "output": 1.25 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 2.79, "throughput_tps": 14.32, "performance_tested_at": "2025-08-04T09:04:22.880Z" } ] }, { "id": "CohereLabs/aya-vision-8b", "object": "model", "created": 1740938806, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.97, "throughput_tps": 71.32, "performance_tested_at": "2025-08-04T09:04:21.053Z" } ] }, { "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct", "object": "model", "created": 1743545840, "owned_by": "meta-llama", "providers": [ { "provider": "cerebras", "status": "live", "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.42, "throughput_tps": 79.35, "performance_tested_at": "2025-08-04T09:04:20.502Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.53, "throughput_tps": 66.2, "performance_tested_at": "2025-08-04T09:04:51.617Z" }, { "provider": "groq", "status": "live", "context_length": 131072, "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.3, "throughput_tps": 108.71, "performance_tested_at": "2025-08-04T09:04:51.392Z" }, { "provider": "sambanova", "status": "live", "context_length": 131072, "pricing": { "input": 0.63, "output": 1.8 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.53, "throughput_tps": 191.12, "performance_tested_at": "2025-08-04T09:04:51.616Z" } ] }, { "id": "MiniMaxAI/MiniMax-M1-80k", "object": "model", "created": 1749802874, "owned_by": "MiniMaxAI", "providers": [ { "provider": "novita", "status": "live", "context_length": 1000000, "pricing": { "input": 0.55, "output": 2.2 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 21.58, "throughput_tps": 45.27, "performance_tested_at": "2025-08-04T09:05:12.669Z" } ] }, { "id": "CohereLabs/aya-expanse-8b", "object": "model", "created": 1729665253, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 0.71, "throughput_tps": 105.19, "performance_tested_at": "2025-08-04T09:04:51.801Z" } ] }, { "id": "Qwen/Qwen2.5-Coder-7B-Instruct", "object": "model", "created": 1726580329, "owned_by": "Qwen", "providers": [ { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "HTTP 503 Service Temporarily Unavailable", "performance_tested_at": "2025-08-04T09:05:07.614Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 0.85, "throughput_tps": 63.37, "performance_tested_at": "2025-08-04T09:04:51.940Z" } ] }, { "id": "CohereLabs/c4ai-command-a-03-2025", "object": "model", "created": 1741684205, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.58, "throughput_tps": 96.87, "performance_tested_at": "2025-08-04T09:04:51.666Z" } ] }, { "id": "Qwen/Qwen2.5-Coder-3B-Instruct", "object": "model", "created": 1730879378, "owned_by": "Qwen", "providers": [ { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 0.79, "throughput_tps": 68.71, "performance_tested_at": "2025-08-04T09:04:51.874Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", "object": "model", "created": 1737364413, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 32000, "pricing": { "input": 0.8, "output": 0.8 }, "supports_tools": false, "supports_structured_output": false, "supports_response_format": true, "latency_s": 18.11, "throughput_tps": 31.42, "performance_tested_at": "2025-08-04T09:05:09.196Z" }, { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.25, "output": 0.75 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 3.35, "throughput_tps": 56.96, "performance_tested_at": "2025-08-04T09:04:54.442Z" }, { "provider": "cerebras", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 0.67, "throughput_tps": 533.14, "performance_tested_at": "2025-08-04T09:04:51.756Z" }, { "provider": "groq", "status": "live", "context_length": 131072, "pricing": { "input": 0.75, "output": 0.99 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 1.15, "throughput_tps": 184.17, "performance_tested_at": "2025-08-04T09:04:52.239Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 16.44, "throughput_tps": 24.7, "performance_tested_at": "2025-08-04T09:05:07.527Z" }, { "provider": "sambanova", "status": "live", "context_length": 131072, "pricing": { "input": 0.7, "output": 1.4 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 4.13, "throughput_tps": 152.64, "performance_tested_at": "2025-08-04T09:04:55.228Z" } ] }, { "id": "Qwen/Qwen3-235B-A22B", "object": "model", "created": 1745726026, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 40960, "pricing": { "input": 0.2, "output": 0.8 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "supports_response_format": true, "latency_s": 3.49, "throughput_tps": 11.74, "performance_tested_at": "2025-08-04T09:04:54.579Z" }, { "provider": "nebius", "status": "live", "context_length": 40960, "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 25.47, "throughput_tps": 24.38, "performance_tested_at": "2025-08-04T09:05:16.561Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 10.41, "throughput_tps": 85.4, "performance_tested_at": "2025-08-04T09:05:01.498Z" }, { "provider": "together", "status": "live", "context_length": 40960, "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 9.38, "throughput_tps": 39.23, "performance_tested_at": "2025-08-04T09:05:00.469Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 14.06, "throughput_tps": 32.36, "performance_tested_at": "2025-08-04T09:05:05.147Z" } ] }, { "id": "aaditya/Llama3-OpenBioLLM-70B", "object": "model", "created": 1713925272, "owned_by": "aaditya", "providers": [ { "provider": "nebius", "status": "live", "context_length": 8192, "pricing": { "input": 0.13, "output": 0.4 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.62, "throughput_tps": 53.54, "performance_tested_at": "2025-08-04T09:05:18.179Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "object": "model", "created": 1737364182, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 32000, "pricing": { "input": 0.04, "output": 0.04 }, "supports_tools": false, "supports_structured_output": true, "supports_response_format": true, "latency_s": 18.76, "throughput_tps": 34, "performance_tested_at": "2025-08-04T09:05:36.326Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 8.69, "throughput_tps": 3.91, "performance_tested_at": "2025-08-04T09:05:26.250Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 5.76, "throughput_tps": 70.16, "performance_tested_at": "2025-08-04T09:05:23.321Z" } ] }, { "id": "microsoft/phi-4", "object": "model", "created": 1733917649, "owned_by": "microsoft", "providers": [ { "provider": "nebius", "status": "live", "context_length": 16384, "pricing": { "input": 0.1, "output": 0.3 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.47, "throughput_tps": 65.45, "performance_tested_at": "2025-08-04T09:05:18.036Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "object": "model", "created": 1737364740, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 64000, "pricing": { "input": 0.3, "output": 0.3 }, "supports_tools": false, "supports_structured_output": true, "supports_response_format": true, "latency_s": 4.01, "throughput_tps": 43.93, "performance_tested_at": "2025-08-04T09:05:21.569Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 15.95, "throughput_tps": 28.39, "performance_tested_at": "2025-08-04T09:05:33.516Z" } ] }, { "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", "object": "model", "created": 1744051630, "owned_by": "nvidia", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.6, "output": 1.8 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 3.78, "throughput_tps": 46.3, "performance_tested_at": "2025-08-04T09:05:21.342Z" } ] }, { "id": "meta-llama/Meta-Llama-3-70B-Instruct", "object": "model", "created": 1713346494, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 8192, "pricing": { "input": 0.51, "output": 0.74 }, "supports_tools": false, "supports_structured_output": true, "supports_function_calling": true, "supports_response_format": true, "latency_s": 1.46, "throughput_tps": 24.04, "performance_tested_at": "2025-08-04T09:05:19.018Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:05:47.564Z" }, { "provider": "together", "status": "live", "context_length": 8192, "pricing": { "input": 0.88, "output": 0.88 }, "supports_tools": false, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 0.48, "throughput_tps": 73.58, "performance_tested_at": "2025-08-04T09:05:18.038Z" }, { "provider": "groq", "status": "live", "context_length": 8192, "pricing": { "input": 0.59, "output": 0.79 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.47, "throughput_tps": 71.77, "performance_tested_at": "2025-08-04T09:05:18.036Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 0.88, "throughput_tps": 36.54, "performance_tested_at": "2025-08-04T09:05:18.439Z" } ] }, { "id": "Sao10K/L3-8B-Stheno-v3.2", "object": "model", "created": 1717583457, "owned_by": "Sao10K", "providers": [ { "provider": "novita", "status": "live", "context_length": 8192, "pricing": { "input": 0.05, "output": 0.05 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.81, "throughput_tps": 49.44, "performance_tested_at": "2025-08-04T09:05:18.372Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 6.37, "throughput_tps": 4.39, "performance_tested_at": "2025-08-04T09:05:23.934Z" } ] }, { "id": "CohereLabs/c4ai-command-r-plus", "object": "model", "created": 1712150824, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.47, "throughput_tps": 54.88, "performance_tested_at": "2025-08-04T09:05:18.037Z" } ] }, { "id": "baidu/ERNIE-4.5-300B-A47B-Base-PT", "object": "model", "created": 1751089026, "owned_by": "baidu", "providers": [ { "provider": "novita", "status": "live", "context_length": 123000, "pricing": { "input": 0.28, "output": 1.1 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 1.22, "throughput_tps": 22.05, "performance_tested_at": "2025-08-04T09:05:18.787Z" } ] }, { "id": "Qwen/Qwen2.5-VL-32B-Instruct", "object": "model", "created": 1742570595, "owned_by": "Qwen", "providers": [ { "provider": "fireworks-ai", "status": "live", "supports_tools": false, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 1.7, "throughput_tps": 68.1, "performance_tested_at": "2025-08-04T09:05:19.266Z" } ] }, { "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "object": "model", "created": 1737364707, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 64000, "pricing": { "input": 0.15, "output": 0.15 }, "supports_tools": false, "supports_structured_output": true, "supports_response_format": true, "latency_s": 13.62, "throughput_tps": 45.15, "performance_tested_at": "2025-08-04T09:05:31.183Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:05:47.564Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": true, "latency_s": 15.28, "throughput_tps": 40.19, "performance_tested_at": "2025-08-04T09:06:03.844Z" } ] }, { "id": "CohereLabs/aya-expanse-32b", "object": "model", "created": 1729665764, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 0.9, "throughput_tps": 79.7, "performance_tested_at": "2025-08-04T09:05:49.469Z" } ] }, { "id": "baidu/ERNIE-4.5-0.3B-PT", "object": "model", "created": 1751091102, "owned_by": "baidu", "providers": [ { "provider": "novita", "status": "live", "context_length": 120000, "supports_tools": false, "supports_structured_output": false, "pricing": { "input": 0, "output": 0 }, "supports_function_calling": true, "latency_s": 1.9, "throughput_tps": 18.43, "performance_tested_at": "2025-08-04T09:05:50.465Z" } ] }, { "id": "Qwen/Qwen2.5-72B-Instruct", "object": "model", "created": 1726487791, "owned_by": "Qwen", "providers": [ { "provider": "novita", "status": "live", "context_length": 32000, "pricing": { "input": 0.38, "output": 0.4 }, "supports_tools": true, "supports_structured_output": false, "latency_s": 0.71, "throughput_tps": 78.41, "performance_tested_at": "2025-08-04T09:05:49.280Z" }, { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.25, "output": 0.75 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.43, "throughput_tps": 123.79, "performance_tested_at": "2025-08-04T09:05:48.994Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 20.56, "throughput_tps": 1.41, "performance_tested_at": "2025-08-04T09:06:09.123Z" }, { "provider": "together", "status": "live", "context_length": 131072, "pricing": { "input": 1.2, "output": 1.2 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 1.39, "throughput_tps": 40.24, "performance_tested_at": "2025-08-04T09:05:49.957Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 1.45, "throughput_tps": 24.06, "performance_tested_at": "2025-08-04T09:05:50.021Z" } ] }, { "id": "meta-llama/Llama-3.1-405B-Instruct", "object": "model", "created": 1721154284, "owned_by": "meta-llama", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 1, "output": 3 }, "supports_tools": true, "supports_structured_output": true, "latency_s": 0.58, "throughput_tps": 100.83, "performance_tested_at": "2025-08-04T09:05:49.141Z" }, { "provider": "fireworks-ai", "status": "live", "supports_tools": true, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 0.5, "throughput_tps": 80.11, "performance_tested_at": "2025-08-04T09:05:49.065Z" }, { "provider": "sambanova", "status": "live", "supports_tools": true, "supports_structured_output": true, "latency_s": 0.71, "throughput_tps": 80.75, "performance_tested_at": "2025-08-04T09:05:49.272Z" } ] }, { "id": "Qwen/Qwen3-235B-A22B-FP8", "object": "model", "created": 1745850968, "owned_by": "Qwen", "providers": [ { "provider": "together", "status": "live", "context_length": 40960, "pricing": { "input": 0.2, "output": 0.6 }, "supports_tools": true, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 19.92, "throughput_tps": 37.15, "performance_tested_at": "2025-08-04T09:06:08.483Z" } ] }, { "id": "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT", "object": "model", "created": 1751089776, "owned_by": "baidu", "providers": [ { "provider": "novita", "status": "live", "context_length": 123000, "pricing": { "input": 0.42, "output": 1.25 }, "supports_tools": false, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 4.24, "throughput_tps": 17.43, "performance_tested_at": "2025-08-04T09:05:52.811Z" } ] }, { "id": "Qwen/Qwen2-VL-72B-Instruct", "object": "model", "created": 1726547134, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 32768, "pricing": { "input": 0.13, "output": 0.4 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.78, "throughput_tps": 57.62, "performance_tested_at": "2025-08-04T09:05:49.347Z" } ] }, { "id": "Qwen/Qwen2.5-Coder-7B", "object": "model", "created": 1726487844, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 32768, "pricing": { "input": 0.03, "output": 0.09 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.34, "throughput_tps": 157.48, "performance_tested_at": "2025-08-04T09:05:48.909Z" }, { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:06:18.567Z" } ] }, { "id": "CohereLabs/aya-vision-32b", "object": "model", "created": 1740951400, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 1.65, "throughput_tps": 61.32, "performance_tested_at": "2025-08-04T09:05:50.213Z" } ] }, { "id": "CohereLabs/c4ai-command-r7b-arabic-02-2025", "object": "model", "created": 1740643869, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.38, "throughput_tps": 71.48, "performance_tested_at": "2025-08-04T09:05:48.944Z" } ] }, { "id": "Qwen/Qwen2.5-VL-72B-Instruct", "object": "model", "created": 1737951124, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 32000, "pricing": { "input": 0.25, "output": 0.75 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.84, "throughput_tps": 54.47, "performance_tested_at": "2025-08-04T09:05:49.411Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 2.01, "throughput_tps": 22.44, "performance_tested_at": "2025-08-04T09:05:50.571Z" } ] }, { "id": "NousResearch/Hermes-2-Pro-Llama-3-8B", "object": "model", "created": 1714436178, "owned_by": "NousResearch", "providers": [ { "provider": "novita", "status": "live", "context_length": 8192, "pricing": { "input": 0.14, "output": 0.14 }, "supports_tools": false, "supports_structured_output": false, "supports_response_format": true, "latency_s": 0.88, "throughput_tps": 36.33, "performance_tested_at": "2025-08-04T09:06:20.450Z" } ] }, { "id": "Qwen/QwQ-32B", "object": "model", "created": 1741184219, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.5, "output": 1.5 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 5.45, "throughput_tps": 84.72, "performance_tested_at": "2025-08-04T09:06:25.022Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 20.12, "throughput_tps": 7.75, "performance_tested_at": "2025-08-04T09:06:39.689Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 3.11, "throughput_tps": 100.76, "performance_tested_at": "2025-08-04T09:06:22.676Z" }, { "provider": "nscale", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 9.71, "throughput_tps": 29.35, "performance_tested_at": "2025-08-04T09:06:29.281Z" } ] }, { "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", "object": "model", "created": 1743540422, "owned_by": "meta-llama", "providers": [ { "provider": "novita", "status": "live", "context_length": 1048576, "pricing": { "input": 0.17, "output": 0.85 }, "supports_tools": true, "supports_structured_output": false, "supports_function_calling": true, "latency_s": 0.74, "throughput_tps": 45.65, "performance_tested_at": "2025-08-04T09:06:20.314Z" }, { "provider": "together", "status": "live", "context_length": 1048576, "pricing": { "input": 0.27, "output": 0.85 }, "supports_tools": true, "supports_structured_output": false, "supports_stop_sequences": true, "latency_s": 0.45, "throughput_tps": 76.02, "performance_tested_at": "2025-08-04T09:06:20.017Z" } ] }, { "id": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO", "object": "model", "created": 1704953687, "owned_by": "NousResearch", "providers": [ { "provider": "together", "status": "live", "context_length": 32768, "pricing": { "input": 0.6, "output": 0.6 }, "supports_tools": false, "supports_structured_output": false, "supports_stop_sequences": true, "latency_s": 0.96, "throughput_tps": 40.47, "performance_tested_at": "2025-08-04T09:06:20.533Z" } ] }, { "id": "Sao10K/L3-70B-Euryale-v2.1", "object": "model", "created": 1718134069, "owned_by": "Sao10K", "providers": [ { "provider": "novita", "status": "live", "context_length": 8192, "pricing": { "input": 1.48, "output": 1.48 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.92, "throughput_tps": 37.01, "performance_tested_at": "2025-08-04T09:06:20.488Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 11.41, "throughput_tps": 2.45, "performance_tested_at": "2025-08-04T09:06:30.977Z" } ] }, { "id": "Qwen/QwQ-32B-Preview", "object": "model", "created": 1732722655, "owned_by": "Qwen", "providers": [ { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 7.21, "throughput_tps": 4.16, "performance_tested_at": "2025-08-04T09:06:26.777Z" }, { "provider": "together", "status": "live", "supports_tools": true, "supports_structured_output": true, "pricing": { "input": 65, "output": 0 }, "context_length": 32768, "supports_stop_sequences": true, "latency_s": 2.93, "throughput_tps": 97.22, "performance_tested_at": "2025-08-04T09:06:22.501Z" } ] }, { "id": "deepseek-ai/DeepSeek-Prover-V2-671B", "object": "model", "created": 1745993675, "owned_by": "deepseek-ai", "providers": [ { "provider": "novita", "status": "live", "context_length": 160000, "pricing": { "input": 0.7, "output": 2.5 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 1.87, "throughput_tps": 21.37, "performance_tested_at": "2025-08-04T09:06:21.441Z" } ] }, { "id": "marin-community/marin-8b-instruct", "object": "model", "created": 1747241066, "owned_by": "marin-community", "providers": [ { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 7.63, "throughput_tps": 3.67, "performance_tested_at": "2025-08-04T09:06:27.201Z" }, { "provider": "together", "status": "live", "context_length": 4096, "pricing": { "input": 0.18000000000000002, "output": 0.18000000000000002 }, "supports_tools": false, "supports_structured_output": true, "supports_stop_sequences": true, "latency_s": 0.62, "throughput_tps": 693.1, "performance_tested_at": "2025-08-04T09:06:20.185Z" } ] }, { "id": "SentientAGI/Dobby-Unhinged-Llama-3.3-70B", "object": "model", "created": 1739304442, "owned_by": "SentientAGI", "providers": [ { "provider": "fireworks-ai", "status": "live", "supports_tools": false, "supports_structured_output": false, "context_length": 163840, "supports_image_input": false, "supports_function_calling": false, "latency_s": 1.03, "throughput_tps": 72.04, "performance_tested_at": "2025-08-04T09:06:20.597Z" } ] }, { "id": "NousResearch/Hermes-3-Llama-3.1-405B", "object": "model", "created": 1723525073, "owned_by": "NousResearch", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 1, "output": 3 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 4.41, "throughput_tps": 32.23, "performance_tested_at": "2025-08-04T09:06:23.975Z" } ] }, { "id": "alpindale/WizardLM-2-8x22B", "object": "model", "created": 1713235019, "owned_by": "alpindale", "providers": [ { "provider": "novita", "status": "live", "context_length": 65535, "pricing": { "input": 0.62, "output": 0.62 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 4.41, "throughput_tps": 23.38, "performance_tested_at": "2025-08-04T09:06:23.975Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 4.02, "throughput_tps": 11.94, "performance_tested_at": "2025-08-04T09:06:23.589Z" } ] }, { "id": "meta-llama/Llama-Guard-4-12B", "object": "model", "created": 1745407825, "owned_by": "meta-llama", "providers": [ { "provider": "groq", "status": "live", "context_length": 131072, "pricing": { "input": 0.2, "output": 0.2 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 0.39, "throughput_tps": 557.65, "performance_tested_at": "2025-08-04T09:06:19.959Z" } ] }, { "id": "Qwen/Qwen2.5-32B-Instruct", "object": "model", "created": 1726546675, "owned_by": "Qwen", "providers": [ { "provider": "nebius", "status": "live", "context_length": 131072, "pricing": { "input": 0.13, "output": 0.4 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 0.37, "throughput_tps": 150.33, "performance_tested_at": "2025-08-04T09:06:41.063Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 7.41, "throughput_tps": 3.92, "performance_tested_at": "2025-08-04T09:06:48.097Z" } ] }, { "id": "dphn/dolphin-2.9.2-mixtral-8x22b", "object": "model", "created": 1716934597, "owned_by": "dphn", "providers": [ { "provider": "novita", "status": "live", "context_length": 16000, "pricing": { "input": 0.9, "output": 0.9 }, "supports_tools": false, "supports_structured_output": false, "latency_s": 3.73, "throughput_tps": 25.48, "performance_tested_at": "2025-08-04T09:06:44.419Z" } ] }, { "id": "Qwen/Qwen2-72B-Instruct", "object": "model", "created": 1716868129, "owned_by": "Qwen", "providers": [ { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:07:10.691Z" }, { "provider": "together", "status": "live", "context_length": 32768, "pricing": { "input": 0.9, "output": 0.9 }, "supports_tools": false, "supports_structured_output": false, "supports_stop_sequences": true, "latency_s": 0.68, "throughput_tps": 64.82, "performance_tested_at": "2025-08-04T09:06:41.369Z" } ] }, { "id": "NousResearch/Hermes-3-Llama-3.1-70B", "object": "model", "created": 1722263277, "owned_by": "NousResearch", "providers": [ { "provider": "featherless-ai", "status": "offline", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "performance_error": "Request timeout", "performance_tested_at": "2025-08-04T09:07:10.691Z" }, { "provider": "hyperbolic", "status": "live", "supports_tools": false, "supports_structured_output": false, "latency_s": 26.93, "throughput_tps": 4.35, "performance_tested_at": "2025-08-04T09:07:07.615Z" } ] }, { "id": "Sao10K/L3-8B-Lunaris-v1", "object": "model", "created": 1719362412, "owned_by": "Sao10K", "providers": [ { "provider": "novita", "status": "live", "context_length": 8192, "pricing": { "input": 0.05, "output": 0.05 }, "supports_tools": false, "supports_structured_output": false, "supports_response_format": true, "latency_s": 1.01, "throughput_tps": 32.63, "performance_tested_at": "2025-08-04T09:06:41.702Z" }, { "provider": "featherless-ai", "status": "live", "pricing": { "input": 0.1, "output": 0.1 }, "context_length": 16384, "latency_s": 8.55, "throughput_tps": 3.51, "performance_tested_at": "2025-08-04T09:06:49.238Z" } ] }, { "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", "object": "model", "created": 1728700633, "owned_by": "nvidia", "providers": [ { "provider": "together", "status": "live", "context_length": 32768, "pricing": { "input": 0.88, "output": 0.88 }, "supports_tools": true, "supports_structured_output": false, "supports_stop_sequences": true, "latency_s": 1.43, "throughput_tps": 74.25, "performance_tested_at": "2025-08-04T09:06:42.118Z" } ] }, { "id": "CohereLabs/c4ai-command-r-v01", "object": "model", "created": 1710172254, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.72, "throughput_tps": 109.72, "performance_tested_at": "2025-08-04T09:06:41.410Z" } ] }, { "id": "tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4", "object": "model", "created": 1740976430, "owned_by": "tokyotech-llm", "providers": [ { "provider": "sambanova", "status": "live", "context_length": 131072, "pricing": { "input": 0.6, "output": 1.2 }, "supports_tools": false, "supports_structured_output": true, "latency_s": 2.99, "throughput_tps": 11.36, "performance_tested_at": "2025-08-04T09:06:43.683Z" } ] }, { "id": "CohereLabs/c4ai-command-r-08-2024", "object": "model", "created": 1724053211, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.44, "throughput_tps": 59.12, "performance_tested_at": "2025-08-04T09:06:41.130Z" } ] }, { "id": "CohereLabs/c4ai-command-r7b-12-2024", "object": "model", "created": 1733932505, "owned_by": "CohereLabs", "providers": [ { "provider": "cohere", "status": "live", "supports_tools": true, "supports_structured_output": false, "latency_s": 0.32, "throughput_tps": 77.16, "performance_tested_at": "2025-08-04T09:06:41.014Z" } ] } ], "generated_at": "2025-08-04T09:07:10.692Z", "metadata": { "total_models": 91, "models_enriched": 75, "providers_enriched": 145, "performance_tested": true, "providers_fetched": { "novita": 52, "sambanova": 10, "groq": 21, "featherless": 5748, "together": 90, "cohere": 0, "fireworks": 32, "nebius": 0, "hyperbolic": 0, "cerebras": 0, "nscale": 0 } } }