inference-metrics / enriched_models_enhanced.json
victor's picture
victor HF Staff
Upload folder using huggingface_hub
15a5288 verified
{
"data": [
{
"id": "zai-org/GLM-4.5",
"object": "model",
"created": 1752981936,
"owned_by": "zai-org",
"providers": [
{
"provider": "novita",
"status": "live",
"pricing": {
"input": 60,
"output": 220
},
"context_length": 131072,
"supports_tools": true,
"supports_structured_output": true,
"supports_response_format": true,
"supports_function_calling": true,
"latency_s": 5.95,
"throughput_tps": 48.9,
"performance_tested_at": "2025-08-04T09:02:05.950Z"
}
]
},
{
"id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
"object": "model",
"created": 1753195958,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 262144,
"pricing": {
"input": 0.95,
"output": 5
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 1.47,
"throughput_tps": 21.09,
"performance_tested_at": "2025-08-04T09:02:01.469Z"
},
{
"provider": "cerebras",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 4.5,
"throughput_tps": 7.77,
"performance_tested_at": "2025-08-04T09:02:04.503Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.7,
"throughput_tps": 48.7,
"performance_tested_at": "2025-08-04T09:02:00.698Z"
},
{
"provider": "together",
"status": "live",
"context_length": 262144,
"pricing": {
"input": 2,
"output": 2
},
"supports_tools": false,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 10,
"throughput_tps": 3.4,
"performance_tested_at": "2025-08-04T09:02:09.996Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 3.2,
"throughput_tps": 10.64,
"performance_tested_at": "2025-08-04T09:02:03.196Z"
}
]
},
{
"id": "moonshotai/Kimi-K2-Instruct",
"object": "model",
"created": 1752195312,
"owned_by": "moonshotai",
"providers": [
{
"provider": "novita",
"status": "live",
"pricing": {
"input": 57,
"output": 230
},
"context_length": 131072,
"supports_tools": true,
"supports_structured_output": true,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 1.06,
"throughput_tps": 28.42,
"performance_tested_at": "2025-08-04T09:02:01.055Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 1.07,
"throughput_tps": 37.37,
"performance_tested_at": "2025-08-04T09:02:01.070Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "HTTP 400 Bad Request",
"performance_tested_at": "2025-08-04T09:02:02.113Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"latency_s": 0.37,
"throughput_tps": 131.18,
"performance_tested_at": "2025-08-04T09:02:00.366Z"
}
]
},
{
"id": "Qwen/Qwen3-235B-A22B-Thinking-2507",
"object": "model",
"created": 1753419545,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.3,
"output": 3
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 6.76,
"throughput_tps": 78.85,
"performance_tested_at": "2025-08-04T09:02:06.760Z"
},
{
"provider": "cerebras",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.96,
"throughput_tps": 355.8,
"performance_tested_at": "2025-08-04T09:02:00.955Z"
}
]
},
{
"id": "CohereLabs/command-a-vision-07-2025",
"object": "model",
"created": 1753689307,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.69,
"throughput_tps": 44.37,
"performance_tested_at": "2025-08-04T09:02:01.690Z"
}
]
},
{
"id": "Qwen/Qwen3-235B-A22B-Instruct-2507",
"object": "model",
"created": 1753080416,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 262144,
"pricing": {
"input": 0.15,
"output": 0.8
},
"supports_tools": true,
"supports_structured_output": true,
"supports_response_format": true,
"supports_function_calling": true,
"latency_s": 0.77,
"throughput_tps": 44.37,
"performance_tested_at": "2025-08-04T09:02:00.766Z"
},
{
"provider": "nebius",
"status": "offline",
"supports_tools": true,
"supports_structured_output": true,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:02:30.001Z"
},
{
"provider": "cerebras",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.49,
"throughput_tps": 70.83,
"performance_tested_at": "2025-08-04T09:02:00.494Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.79,
"throughput_tps": 43.05,
"performance_tested_at": "2025-08-04T09:02:00.789Z"
},
{
"provider": "together",
"status": "live",
"context_length": 262144,
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 0.67,
"throughput_tps": 48.91,
"performance_tested_at": "2025-08-04T09:02:00.674Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.75,
"throughput_tps": 20,
"performance_tested_at": "2025-08-04T09:02:01.750Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.75,
"throughput_tps": 42.6,
"performance_tested_at": "2025-08-04T09:02:00.751Z"
}
]
},
{
"id": "meta-llama/Llama-3.1-8B-Instruct",
"object": "model",
"created": 1721292960,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 16384,
"pricing": {
"input": 0.02,
"output": 0.05
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.81,
"throughput_tps": 72.84,
"performance_tested_at": "2025-08-04T09:02:31.814Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.03,
"output": 0.09
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.44,
"throughput_tps": 72.65,
"performance_tested_at": "2025-08-04T09:02:31.445Z"
},
{
"provider": "cerebras",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.46,
"throughput_tps": 127.5,
"performance_tested_at": "2025-08-04T09:02:31.467Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.38,
"throughput_tps": 86.94,
"performance_tested_at": "2025-08-04T09:02:31.384Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 7.23,
"throughput_tps": 3.87,
"performance_tested_at": "2025-08-04T09:02:38.233Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.39,
"throughput_tps": 23.76,
"performance_tested_at": "2025-08-04T09:02:32.395Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.7,
"throughput_tps": 82.27,
"performance_tested_at": "2025-08-04T09:02:31.711Z"
},
{
"provider": "sambanova",
"status": "live",
"context_length": 16384,
"pricing": {
"input": 0.1,
"output": 0.2
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.53,
"throughput_tps": 107.02,
"performance_tested_at": "2025-08-04T09:02:31.539Z"
}
]
},
{
"id": "zai-org/GLM-4.5-Air-FP8",
"object": "model",
"created": 1752982200,
"owned_by": "zai-org",
"providers": [
{
"provider": "together",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"pricing": {
"input": 65,
"output": 0
},
"context_length": 32768,
"supports_stop_sequences": true,
"latency_s": 2.67,
"throughput_tps": 99.6,
"performance_tested_at": "2025-08-04T09:02:33.677Z"
}
]
},
{
"id": "HuggingFaceTB/SmolLM3-3B",
"object": "model",
"created": 1751969505,
"owned_by": "HuggingFaceTB",
"providers": [
{
"provider": "hf-inference",
"status": "offline",
"supports_tools": true,
"supports_structured_output": true,
"performance_error": "HTTP 404 Not Found",
"performance_tested_at": "2025-08-04T09:02:31.217Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1",
"object": "model",
"created": 1737344767,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 64000,
"pricing": {
"input": 0.7,
"output": 2.5
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 6.51,
"throughput_tps": 23.35,
"performance_tested_at": "2025-08-04T09:02:37.516Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 163840,
"pricing": {
"input": 2,
"output": 6
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 3.92,
"throughput_tps": 71.42,
"performance_tested_at": "2025-08-04T09:02:34.927Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 3.73,
"throughput_tps": 70.06,
"performance_tested_at": "2025-08-04T09:02:34.732Z"
},
{
"provider": "together",
"status": "offline",
"context_length": 163840,
"pricing": {
"input": 3,
"output": 7
},
"supports_tools": false,
"supports_structured_output": true,
"supports_stop_sequences": true,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:03:01.007Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 3.35,
"throughput_tps": 56.99,
"performance_tested_at": "2025-08-04T09:02:34.358Z"
},
{
"provider": "sambanova",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"pricing": {
"input": 5,
"output": 7
},
"context_length": 32768,
"latency_s": 14.05,
"throughput_tps": 118.05,
"performance_tested_at": "2025-08-04T09:02:45.120Z"
}
]
},
{
"id": "Qwen/Qwen3-30B-A3B",
"object": "model",
"created": 1745725385,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.1,
"output": 0.45
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 24.67,
"throughput_tps": 12.36,
"performance_tested_at": "2025-08-04T09:02:55.679Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.3,
"output": 0.9
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 2.38,
"throughput_tps": 124.51,
"performance_tested_at": "2025-08-04T09:02:33.384Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 2,
"throughput_tps": 111.18,
"performance_tested_at": "2025-08-04T09:02:33.003Z"
}
]
},
{
"id": "Qwen/Qwen3-8B",
"object": "model",
"created": 1745725341,
"owned_by": "Qwen",
"providers": [
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 9.66,
"throughput_tps": 18.84,
"performance_tested_at": "2025-08-04T09:02:40.667Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 3.77,
"throughput_tps": 62.78,
"performance_tested_at": "2025-08-04T09:03:05.784Z"
}
]
},
{
"id": "google/gemma-3-27b-it",
"object": "model",
"created": 1740856219,
"owned_by": "google",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 110000,
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.46,
"throughput_tps": 75.3,
"performance_tested_at": "2025-08-04T09:03:02.474Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 16.71,
"throughput_tps": 3.83,
"performance_tested_at": "2025-08-04T09:03:18.719Z"
}
]
},
{
"id": "zai-org/GLM-4.1V-9B-Thinking",
"object": "model",
"created": 1751120650,
"owned_by": "zai-org",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 65536,
"pricing": {
"input": 0.035,
"output": 0.138
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.31,
"throughput_tps": 70.18,
"performance_tested_at": "2025-08-04T09:03:03.320Z"
}
]
},
{
"id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
"object": "model",
"created": 1753197829,
"owned_by": "Qwen",
"providers": [
{
"provider": "together",
"status": "live",
"context_length": 262144,
"pricing": {
"input": 2,
"output": 2
},
"supports_tools": false,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 1.1,
"throughput_tps": 31.9,
"performance_tested_at": "2025-08-04T09:03:03.107Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-0528",
"object": "model",
"created": 1748425602,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"pricing": {
"input": 70,
"output": 250
},
"context_length": 163840,
"supports_tools": true,
"supports_structured_output": true,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 17.97,
"throughput_tps": 26.27,
"performance_tested_at": "2025-08-04T09:03:19.977Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.8,
"output": 2.4
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 11.03,
"throughput_tps": 28.74,
"performance_tested_at": "2025-08-04T09:03:13.038Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"context_length": 163840,
"supports_tools": false,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 1.03,
"throughput_tps": 82.88,
"performance_tested_at": "2025-08-04T09:03:03.035Z"
},
{
"provider": "together",
"status": "live",
"pricing": {
"input": 65,
"output": 0
},
"context_length": 32768,
"supports_stop_sequences": true,
"latency_s": 4.66,
"throughput_tps": 30.7,
"performance_tested_at": "2025-08-04T09:03:06.668Z"
},
{
"provider": "hyperbolic",
"status": "live",
"latency_s": 3.11,
"throughput_tps": 75.29,
"performance_tested_at": "2025-08-04T09:03:05.118Z"
},
{
"provider": "sambanova",
"status": "live",
"pricing": {
"input": 5,
"output": 7
},
"context_length": 32768,
"latency_s": 17.96,
"throughput_tps": 126.51,
"performance_tested_at": "2025-08-04T09:03:19.977Z"
}
]
},
{
"id": "Qwen/Qwen2.5-VL-7B-Instruct",
"object": "model",
"created": 1737883597,
"owned_by": "Qwen",
"providers": [
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.59,
"throughput_tps": 77.4,
"performance_tested_at": "2025-08-04T09:03:02.604Z"
}
]
},
{
"id": "meta-llama/Meta-Llama-3-8B-Instruct",
"object": "model",
"created": 1713346512,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.04,
"output": 0.04
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.97,
"throughput_tps": 59.51,
"performance_tested_at": "2025-08-04T09:03:02.984Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 4.55,
"throughput_tps": 6.6,
"performance_tested_at": "2025-08-04T09:03:06.556Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.05,
"output": 0.08
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.51,
"throughput_tps": 71.01,
"performance_tested_at": "2025-08-04T09:03:02.517Z"
}
]
},
{
"id": "meta-llama/Llama-3.2-3B-Instruct",
"object": "model",
"created": 1726672760,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.03,
"output": 0.05
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 0.9,
"throughput_tps": 63.17,
"performance_tested_at": "2025-08-04T09:03:02.912Z"
},
{
"provider": "together",
"status": "offline",
"context_length": 131072,
"pricing": {
"input": 0.060000000000000005,
"output": 0.060000000000000005
},
"supports_tools": false,
"supports_structured_output": false,
"supports_stop_sequences": true,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:03:32.011Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.08,
"throughput_tps": 46.38,
"performance_tested_at": "2025-08-04T09:03:03.087Z"
}
]
},
{
"id": "Qwen/Qwen3-32B",
"object": "model",
"created": 1745725979,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.1,
"output": 0.45
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 14.2,
"throughput_tps": 43.94,
"performance_tested_at": "2025-08-04T09:03:16.210Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.1,
"output": 0.3
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 11.13,
"throughput_tps": 32.16,
"performance_tested_at": "2025-08-04T09:03:13.142Z"
},
{
"provider": "cerebras",
"status": "live",
"pricing": {
"input": 0.4,
"output": 0.8
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.48,
"throughput_tps": 368.47,
"performance_tested_at": "2025-08-04T09:03:33.490Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:04:03.013Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.29,
"output": 0.59
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.25,
"throughput_tps": 186.18,
"performance_tested_at": "2025-08-04T09:03:34.264Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 10.08,
"throughput_tps": 28.57,
"performance_tested_at": "2025-08-04T09:03:43.093Z"
},
{
"provider": "sambanova",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.4,
"output": 0.8
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.97,
"throughput_tps": 261.95,
"performance_tested_at": "2025-08-04T09:03:34.991Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
"object": "model",
"created": 1748516867,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 128000,
"pricing": {
"input": 0.06,
"output": 0.09
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 6.38,
"throughput_tps": 85.84,
"performance_tested_at": "2025-08-04T09:03:39.396Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 9.96,
"throughput_tps": 0,
"performance_tested_at": "2025-08-04T09:03:42.973Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-V3-0324",
"object": "model",
"created": 1742808502,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 163840,
"pricing": {
"input": 0.28,
"output": 1.14
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 2.15,
"throughput_tps": 19.11,
"performance_tested_at": "2025-08-04T09:03:35.158Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 163840,
"pricing": {
"input": 2,
"output": 6
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.88,
"throughput_tps": 48.6,
"performance_tested_at": "2025-08-04T09:03:33.897Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 1.41,
"throughput_tps": 49.77,
"performance_tested_at": "2025-08-04T09:03:34.419Z"
},
{
"provider": "together",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 1.25,
"output": 1.25
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 1.37,
"throughput_tps": 29.89,
"performance_tested_at": "2025-08-04T09:03:34.385Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.5,
"throughput_tps": 27.37,
"performance_tested_at": "2025-08-04T09:03:34.510Z"
},
{
"provider": "sambanova",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 3,
"output": 4.5
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 1.06,
"throughput_tps": 34.89,
"performance_tested_at": "2025-08-04T09:03:34.073Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
"object": "model",
"created": 1737363858,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 27.68,
"throughput_tps": 26.92,
"performance_tested_at": "2025-08-04T09:04:00.688Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 3.39,
"throughput_tps": 169.05,
"performance_tested_at": "2025-08-04T09:03:36.402Z"
}
]
},
{
"id": "meta-llama/Llama-3.3-70B-Instruct",
"object": "model",
"created": 1732637327,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.13,
"output": 0.39
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 0.61,
"throughput_tps": 96.29,
"performance_tested_at": "2025-08-04T09:03:33.625Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.25,
"output": 0.75
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.45,
"throughput_tps": 128.36,
"performance_tested_at": "2025-08-04T09:03:33.464Z"
},
{
"provider": "cerebras",
"status": "live",
"pricing": {
"input": 0.85,
"output": 1.2
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 15.09,
"throughput_tps": 3.91,
"performance_tested_at": "2025-08-04T09:03:48.106Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.66,
"throughput_tps": 86.78,
"performance_tested_at": "2025-08-04T09:03:33.669Z"
},
{
"provider": "together",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.88,
"output": 0.88
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 0.56,
"throughput_tps": 103.62,
"performance_tested_at": "2025-08-04T09:03:33.572Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.59,
"output": 0.79
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.3,
"throughput_tps": 195.82,
"performance_tested_at": "2025-08-04T09:04:04.311Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.19,
"throughput_tps": 29.32,
"performance_tested_at": "2025-08-04T09:04:05.208Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 1.04,
"throughput_tps": 58.74,
"performance_tested_at": "2025-08-04T09:04:05.053Z"
},
{
"provider": "sambanova",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.6,
"output": 1.2
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.47,
"throughput_tps": 128.28,
"performance_tested_at": "2025-08-04T09:04:04.482Z"
}
]
},
{
"id": "google/gemma-2-2b-it",
"object": "model",
"created": 1721127099,
"owned_by": "google",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.02,
"output": 0.06
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.38,
"throughput_tps": 107.92,
"performance_tested_at": "2025-08-04T09:04:04.394Z"
}
]
},
{
"id": "zai-org/GLM-4-32B-0414",
"object": "model",
"created": 1744030421,
"owned_by": "zai-org",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 32000,
"pricing": {
"input": 0.24,
"output": 0.24
},
"supports_tools": false,
"supports_structured_output": true,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 1.09,
"throughput_tps": 27.53,
"performance_tested_at": "2025-08-04T09:04:05.104Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "HTTP 503 Service Temporarily Unavailable",
"performance_tested_at": "2025-08-04T09:04:18.588Z"
}
]
},
{
"id": "Qwen/Qwen3-4B",
"object": "model",
"created": 1745725289,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.08,
"output": 0.24
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 1.3,
"throughput_tps": 135.55,
"performance_tested_at": "2025-08-04T09:04:05.313Z"
}
]
},
{
"id": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
"object": "model",
"created": 1743600857,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.1,
"output": 0.5
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 0.81,
"throughput_tps": 40.59,
"performance_tested_at": "2025-08-04T09:04:04.828Z"
},
{
"provider": "cerebras",
"status": "live",
"pricing": {
"input": 0.65,
"output": 0.85
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.4,
"throughput_tps": 88.53,
"performance_tested_at": "2025-08-04T09:04:04.410Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.61,
"throughput_tps": 52.16,
"performance_tested_at": "2025-08-04T09:04:04.628Z"
},
{
"provider": "together",
"status": "live",
"context_length": 1048576,
"pricing": {
"input": 0.18000000000000002,
"output": 0.5900000000000001
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 0.34,
"throughput_tps": 95.75,
"performance_tested_at": "2025-08-04T09:04:04.359Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.11,
"output": 0.34
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.26,
"throughput_tps": 132.65,
"performance_tested_at": "2025-08-04T09:04:04.271Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.61,
"throughput_tps": 56.17,
"performance_tested_at": "2025-08-04T09:04:04.620Z"
}
]
},
{
"id": "meta-llama/Llama-3.2-1B-Instruct",
"object": "model",
"created": 1726672367,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 131000,
"supports_tools": false,
"supports_structured_output": false,
"pricing": {
"input": 0,
"output": 0
},
"latency_s": 1.85,
"throughput_tps": 39.99,
"performance_tested_at": "2025-08-04T09:04:05.865Z"
}
]
},
{
"id": "Qwen/Qwen2.5-7B-Instruct",
"object": "model",
"created": 1726487740,
"owned_by": "Qwen",
"providers": [
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 4.79,
"throughput_tps": 5.84,
"performance_tested_at": "2025-08-04T09:04:08.809Z"
},
{
"provider": "together",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.3,
"output": 0.3
},
"supports_tools": true,
"supports_structured_output": false,
"supports_stop_sequences": true,
"latency_s": 0.41,
"throughput_tps": 136.18,
"performance_tested_at": "2025-08-04T09:04:04.426Z"
}
]
},
{
"id": "Qwen/Qwen3-14B",
"object": "model",
"created": 1745725365,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.08,
"output": 0.24
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 10.15,
"throughput_tps": 68.28,
"performance_tested_at": "2025-08-04T09:04:14.164Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "HTTP 503 Service Temporarily Unavailable",
"performance_tested_at": "2025-08-04T09:04:19.084Z"
}
]
},
{
"id": "baidu/ERNIE-4.5-21B-A3B-PT",
"object": "model",
"created": 1751091210,
"owned_by": "baidu",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 120000,
"pricing": {
"input": 0.07,
"output": 0.28
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 1.31,
"throughput_tps": 27.4,
"performance_tested_at": "2025-08-04T09:04:05.328Z"
}
]
},
{
"id": "meta-llama/Llama-3.1-70B-Instruct",
"object": "model",
"created": 1721146066,
"owned_by": "meta-llama",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.13,
"output": 0.4
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.58,
"throughput_tps": 54.96,
"performance_tested_at": "2025-08-04T09:04:20.668Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.78,
"throughput_tps": 47.23,
"performance_tested_at": "2025-08-04T09:04:20.869Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.18,
"throughput_tps": 28.87,
"performance_tested_at": "2025-08-04T09:04:21.263Z"
}
]
},
{
"id": "baidu/ERNIE-4.5-VL-28B-A3B-PT",
"object": "model",
"created": 1751089833,
"owned_by": "baidu",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 30000,
"pricing": {
"input": 0.14,
"output": 0.56
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 1.08,
"throughput_tps": 36.93,
"performance_tested_at": "2025-08-04T09:04:21.169Z"
}
]
},
{
"id": "Qwen/Qwen2.5-Coder-32B-Instruct",
"object": "model",
"created": 1730879390,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.1,
"output": 0.3
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.05,
"throughput_tps": 53.37,
"performance_tested_at": "2025-08-04T09:04:21.135Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 6.82,
"throughput_tps": 4.1,
"performance_tested_at": "2025-08-04T09:04:26.911Z"
},
{
"provider": "together",
"status": "live",
"context_length": 16384,
"pricing": {
"input": 0.8,
"output": 0.8
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 0.45,
"throughput_tps": 121.89,
"performance_tested_at": "2025-08-04T09:04:20.537Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.09,
"throughput_tps": 32.12,
"performance_tested_at": "2025-08-04T09:04:21.175Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.91,
"throughput_tps": 60.36,
"performance_tested_at": "2025-08-04T09:04:20.997Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
"object": "model",
"created": 1737364574,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:04:50.087Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 4.11,
"throughput_tps": 73.52,
"performance_tested_at": "2025-08-04T09:04:24.193Z"
}
]
},
{
"id": "google/gemma-2-9b-it",
"object": "model",
"created": 1719216341,
"owned_by": "google",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.03,
"output": 0.09
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.98,
"throughput_tps": 41.96,
"performance_tested_at": "2025-08-04T09:04:21.063Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 7.92,
"throughput_tps": 3.91,
"performance_tested_at": "2025-08-04T09:04:28.009Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.2,
"output": 0.2
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.4,
"throughput_tps": 92.08,
"performance_tested_at": "2025-08-04T09:04:20.488Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-V3",
"object": "model",
"created": 1735131143,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 64000,
"pricing": {
"input": 0.4,
"output": 1.3
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 1.69,
"throughput_tps": 23.1,
"performance_tested_at": "2025-08-04T09:04:21.774Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 163840,
"pricing": {
"input": 0.5,
"output": 1.5
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.62,
"throughput_tps": 46.9,
"performance_tested_at": "2025-08-04T09:04:20.704Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.74,
"throughput_tps": 79.62,
"performance_tested_at": "2025-08-04T09:04:20.827Z"
},
{
"provider": "together",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 1.25,
"output": 1.25
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 2.79,
"throughput_tps": 14.32,
"performance_tested_at": "2025-08-04T09:04:22.880Z"
}
]
},
{
"id": "CohereLabs/aya-vision-8b",
"object": "model",
"created": 1740938806,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.97,
"throughput_tps": 71.32,
"performance_tested_at": "2025-08-04T09:04:21.053Z"
}
]
},
{
"id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
"object": "model",
"created": 1743545840,
"owned_by": "meta-llama",
"providers": [
{
"provider": "cerebras",
"status": "live",
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.42,
"throughput_tps": 79.35,
"performance_tested_at": "2025-08-04T09:04:20.502Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.53,
"throughput_tps": 66.2,
"performance_tested_at": "2025-08-04T09:04:51.617Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.3,
"throughput_tps": 108.71,
"performance_tested_at": "2025-08-04T09:04:51.392Z"
},
{
"provider": "sambanova",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.63,
"output": 1.8
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.53,
"throughput_tps": 191.12,
"performance_tested_at": "2025-08-04T09:04:51.616Z"
}
]
},
{
"id": "MiniMaxAI/MiniMax-M1-80k",
"object": "model",
"created": 1749802874,
"owned_by": "MiniMaxAI",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 1000000,
"pricing": {
"input": 0.55,
"output": 2.2
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 21.58,
"throughput_tps": 45.27,
"performance_tested_at": "2025-08-04T09:05:12.669Z"
}
]
},
{
"id": "CohereLabs/aya-expanse-8b",
"object": "model",
"created": 1729665253,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.71,
"throughput_tps": 105.19,
"performance_tested_at": "2025-08-04T09:04:51.801Z"
}
]
},
{
"id": "Qwen/Qwen2.5-Coder-7B-Instruct",
"object": "model",
"created": 1726580329,
"owned_by": "Qwen",
"providers": [
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "HTTP 503 Service Temporarily Unavailable",
"performance_tested_at": "2025-08-04T09:05:07.614Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.85,
"throughput_tps": 63.37,
"performance_tested_at": "2025-08-04T09:04:51.940Z"
}
]
},
{
"id": "CohereLabs/c4ai-command-a-03-2025",
"object": "model",
"created": 1741684205,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.58,
"throughput_tps": 96.87,
"performance_tested_at": "2025-08-04T09:04:51.666Z"
}
]
},
{
"id": "Qwen/Qwen2.5-Coder-3B-Instruct",
"object": "model",
"created": 1730879378,
"owned_by": "Qwen",
"providers": [
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.79,
"throughput_tps": 68.71,
"performance_tested_at": "2025-08-04T09:04:51.874Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
"object": "model",
"created": 1737364413,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 32000,
"pricing": {
"input": 0.8,
"output": 0.8
},
"supports_tools": false,
"supports_structured_output": false,
"supports_response_format": true,
"latency_s": 18.11,
"throughput_tps": 31.42,
"performance_tested_at": "2025-08-04T09:05:09.196Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.25,
"output": 0.75
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 3.35,
"throughput_tps": 56.96,
"performance_tested_at": "2025-08-04T09:04:54.442Z"
},
{
"provider": "cerebras",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.67,
"throughput_tps": 533.14,
"performance_tested_at": "2025-08-04T09:04:51.756Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.75,
"output": 0.99
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 1.15,
"throughput_tps": 184.17,
"performance_tested_at": "2025-08-04T09:04:52.239Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 16.44,
"throughput_tps": 24.7,
"performance_tested_at": "2025-08-04T09:05:07.527Z"
},
{
"provider": "sambanova",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.7,
"output": 1.4
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 4.13,
"throughput_tps": 152.64,
"performance_tested_at": "2025-08-04T09:04:55.228Z"
}
]
},
{
"id": "Qwen/Qwen3-235B-A22B",
"object": "model",
"created": 1745726026,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.2,
"output": 0.8
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 3.49,
"throughput_tps": 11.74,
"performance_tested_at": "2025-08-04T09:04:54.579Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 25.47,
"throughput_tps": 24.38,
"performance_tested_at": "2025-08-04T09:05:16.561Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 10.41,
"throughput_tps": 85.4,
"performance_tested_at": "2025-08-04T09:05:01.498Z"
},
{
"provider": "together",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 9.38,
"throughput_tps": 39.23,
"performance_tested_at": "2025-08-04T09:05:00.469Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 14.06,
"throughput_tps": 32.36,
"performance_tested_at": "2025-08-04T09:05:05.147Z"
}
]
},
{
"id": "aaditya/Llama3-OpenBioLLM-70B",
"object": "model",
"created": 1713925272,
"owned_by": "aaditya",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.13,
"output": 0.4
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.62,
"throughput_tps": 53.54,
"performance_tested_at": "2025-08-04T09:05:18.179Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
"object": "model",
"created": 1737364182,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 32000,
"pricing": {
"input": 0.04,
"output": 0.04
},
"supports_tools": false,
"supports_structured_output": true,
"supports_response_format": true,
"latency_s": 18.76,
"throughput_tps": 34,
"performance_tested_at": "2025-08-04T09:05:36.326Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 8.69,
"throughput_tps": 3.91,
"performance_tested_at": "2025-08-04T09:05:26.250Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 5.76,
"throughput_tps": 70.16,
"performance_tested_at": "2025-08-04T09:05:23.321Z"
}
]
},
{
"id": "microsoft/phi-4",
"object": "model",
"created": 1733917649,
"owned_by": "microsoft",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 16384,
"pricing": {
"input": 0.1,
"output": 0.3
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.47,
"throughput_tps": 65.45,
"performance_tested_at": "2025-08-04T09:05:18.036Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
"object": "model",
"created": 1737364740,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 64000,
"pricing": {
"input": 0.3,
"output": 0.3
},
"supports_tools": false,
"supports_structured_output": true,
"supports_response_format": true,
"latency_s": 4.01,
"throughput_tps": 43.93,
"performance_tested_at": "2025-08-04T09:05:21.569Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 15.95,
"throughput_tps": 28.39,
"performance_tested_at": "2025-08-04T09:05:33.516Z"
}
]
},
{
"id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",
"object": "model",
"created": 1744051630,
"owned_by": "nvidia",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.6,
"output": 1.8
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 3.78,
"throughput_tps": 46.3,
"performance_tested_at": "2025-08-04T09:05:21.342Z"
}
]
},
{
"id": "meta-llama/Meta-Llama-3-70B-Instruct",
"object": "model",
"created": 1713346494,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.51,
"output": 0.74
},
"supports_tools": false,
"supports_structured_output": true,
"supports_function_calling": true,
"supports_response_format": true,
"latency_s": 1.46,
"throughput_tps": 24.04,
"performance_tested_at": "2025-08-04T09:05:19.018Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:05:47.564Z"
},
{
"provider": "together",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.88,
"output": 0.88
},
"supports_tools": false,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 0.48,
"throughput_tps": 73.58,
"performance_tested_at": "2025-08-04T09:05:18.038Z"
},
{
"provider": "groq",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.59,
"output": 0.79
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.47,
"throughput_tps": 71.77,
"performance_tested_at": "2025-08-04T09:05:18.036Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.88,
"throughput_tps": 36.54,
"performance_tested_at": "2025-08-04T09:05:18.439Z"
}
]
},
{
"id": "Sao10K/L3-8B-Stheno-v3.2",
"object": "model",
"created": 1717583457,
"owned_by": "Sao10K",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.05,
"output": 0.05
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.81,
"throughput_tps": 49.44,
"performance_tested_at": "2025-08-04T09:05:18.372Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 6.37,
"throughput_tps": 4.39,
"performance_tested_at": "2025-08-04T09:05:23.934Z"
}
]
},
{
"id": "CohereLabs/c4ai-command-r-plus",
"object": "model",
"created": 1712150824,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.47,
"throughput_tps": 54.88,
"performance_tested_at": "2025-08-04T09:05:18.037Z"
}
]
},
{
"id": "baidu/ERNIE-4.5-300B-A47B-Base-PT",
"object": "model",
"created": 1751089026,
"owned_by": "baidu",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 123000,
"pricing": {
"input": 0.28,
"output": 1.1
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 1.22,
"throughput_tps": 22.05,
"performance_tested_at": "2025-08-04T09:05:18.787Z"
}
]
},
{
"id": "Qwen/Qwen2.5-VL-32B-Instruct",
"object": "model",
"created": 1742570595,
"owned_by": "Qwen",
"providers": [
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 1.7,
"throughput_tps": 68.1,
"performance_tested_at": "2025-08-04T09:05:19.266Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
"object": "model",
"created": 1737364707,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 64000,
"pricing": {
"input": 0.15,
"output": 0.15
},
"supports_tools": false,
"supports_structured_output": true,
"supports_response_format": true,
"latency_s": 13.62,
"throughput_tps": 45.15,
"performance_tested_at": "2025-08-04T09:05:31.183Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:05:47.564Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 15.28,
"throughput_tps": 40.19,
"performance_tested_at": "2025-08-04T09:06:03.844Z"
}
]
},
{
"id": "CohereLabs/aya-expanse-32b",
"object": "model",
"created": 1729665764,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.9,
"throughput_tps": 79.7,
"performance_tested_at": "2025-08-04T09:05:49.469Z"
}
]
},
{
"id": "baidu/ERNIE-4.5-0.3B-PT",
"object": "model",
"created": 1751091102,
"owned_by": "baidu",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 120000,
"supports_tools": false,
"supports_structured_output": false,
"pricing": {
"input": 0,
"output": 0
},
"supports_function_calling": true,
"latency_s": 1.9,
"throughput_tps": 18.43,
"performance_tested_at": "2025-08-04T09:05:50.465Z"
}
]
},
{
"id": "Qwen/Qwen2.5-72B-Instruct",
"object": "model",
"created": 1726487791,
"owned_by": "Qwen",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 32000,
"pricing": {
"input": 0.38,
"output": 0.4
},
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.71,
"throughput_tps": 78.41,
"performance_tested_at": "2025-08-04T09:05:49.280Z"
},
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.25,
"output": 0.75
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.43,
"throughput_tps": 123.79,
"performance_tested_at": "2025-08-04T09:05:48.994Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 20.56,
"throughput_tps": 1.41,
"performance_tested_at": "2025-08-04T09:06:09.123Z"
},
{
"provider": "together",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 1.2,
"output": 1.2
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 1.39,
"throughput_tps": 40.24,
"performance_tested_at": "2025-08-04T09:05:49.957Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.45,
"throughput_tps": 24.06,
"performance_tested_at": "2025-08-04T09:05:50.021Z"
}
]
},
{
"id": "meta-llama/Llama-3.1-405B-Instruct",
"object": "model",
"created": 1721154284,
"owned_by": "meta-llama",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 1,
"output": 3
},
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.58,
"throughput_tps": 100.83,
"performance_tested_at": "2025-08-04T09:05:49.141Z"
},
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 0.5,
"throughput_tps": 80.11,
"performance_tested_at": "2025-08-04T09:05:49.065Z"
},
{
"provider": "sambanova",
"status": "live",
"supports_tools": true,
"supports_structured_output": true,
"latency_s": 0.71,
"throughput_tps": 80.75,
"performance_tested_at": "2025-08-04T09:05:49.272Z"
}
]
},
{
"id": "Qwen/Qwen3-235B-A22B-FP8",
"object": "model",
"created": 1745850968,
"owned_by": "Qwen",
"providers": [
{
"provider": "together",
"status": "live",
"context_length": 40960,
"pricing": {
"input": 0.2,
"output": 0.6
},
"supports_tools": true,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 19.92,
"throughput_tps": 37.15,
"performance_tested_at": "2025-08-04T09:06:08.483Z"
}
]
},
{
"id": "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT",
"object": "model",
"created": 1751089776,
"owned_by": "baidu",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 123000,
"pricing": {
"input": 0.42,
"output": 1.25
},
"supports_tools": false,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 4.24,
"throughput_tps": 17.43,
"performance_tested_at": "2025-08-04T09:05:52.811Z"
}
]
},
{
"id": "Qwen/Qwen2-VL-72B-Instruct",
"object": "model",
"created": 1726547134,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.13,
"output": 0.4
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.78,
"throughput_tps": 57.62,
"performance_tested_at": "2025-08-04T09:05:49.347Z"
}
]
},
{
"id": "Qwen/Qwen2.5-Coder-7B",
"object": "model",
"created": 1726487844,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.03,
"output": 0.09
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.34,
"throughput_tps": 157.48,
"performance_tested_at": "2025-08-04T09:05:48.909Z"
},
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:06:18.567Z"
}
]
},
{
"id": "CohereLabs/aya-vision-32b",
"object": "model",
"created": 1740951400,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.65,
"throughput_tps": 61.32,
"performance_tested_at": "2025-08-04T09:05:50.213Z"
}
]
},
{
"id": "CohereLabs/c4ai-command-r7b-arabic-02-2025",
"object": "model",
"created": 1740643869,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.38,
"throughput_tps": 71.48,
"performance_tested_at": "2025-08-04T09:05:48.944Z"
}
]
},
{
"id": "Qwen/Qwen2.5-VL-72B-Instruct",
"object": "model",
"created": 1737951124,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 32000,
"pricing": {
"input": 0.25,
"output": 0.75
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.84,
"throughput_tps": 54.47,
"performance_tested_at": "2025-08-04T09:05:49.411Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 2.01,
"throughput_tps": 22.44,
"performance_tested_at": "2025-08-04T09:05:50.571Z"
}
]
},
{
"id": "NousResearch/Hermes-2-Pro-Llama-3-8B",
"object": "model",
"created": 1714436178,
"owned_by": "NousResearch",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.14,
"output": 0.14
},
"supports_tools": false,
"supports_structured_output": false,
"supports_response_format": true,
"latency_s": 0.88,
"throughput_tps": 36.33,
"performance_tested_at": "2025-08-04T09:06:20.450Z"
}
]
},
{
"id": "Qwen/QwQ-32B",
"object": "model",
"created": 1741184219,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.5,
"output": 1.5
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 5.45,
"throughput_tps": 84.72,
"performance_tested_at": "2025-08-04T09:06:25.022Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 20.12,
"throughput_tps": 7.75,
"performance_tested_at": "2025-08-04T09:06:39.689Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 3.11,
"throughput_tps": 100.76,
"performance_tested_at": "2025-08-04T09:06:22.676Z"
},
{
"provider": "nscale",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 9.71,
"throughput_tps": 29.35,
"performance_tested_at": "2025-08-04T09:06:29.281Z"
}
]
},
{
"id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
"object": "model",
"created": 1743540422,
"owned_by": "meta-llama",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 1048576,
"pricing": {
"input": 0.17,
"output": 0.85
},
"supports_tools": true,
"supports_structured_output": false,
"supports_function_calling": true,
"latency_s": 0.74,
"throughput_tps": 45.65,
"performance_tested_at": "2025-08-04T09:06:20.314Z"
},
{
"provider": "together",
"status": "live",
"context_length": 1048576,
"pricing": {
"input": 0.27,
"output": 0.85
},
"supports_tools": true,
"supports_structured_output": false,
"supports_stop_sequences": true,
"latency_s": 0.45,
"throughput_tps": 76.02,
"performance_tested_at": "2025-08-04T09:06:20.017Z"
}
]
},
{
"id": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
"object": "model",
"created": 1704953687,
"owned_by": "NousResearch",
"providers": [
{
"provider": "together",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.6,
"output": 0.6
},
"supports_tools": false,
"supports_structured_output": false,
"supports_stop_sequences": true,
"latency_s": 0.96,
"throughput_tps": 40.47,
"performance_tested_at": "2025-08-04T09:06:20.533Z"
}
]
},
{
"id": "Sao10K/L3-70B-Euryale-v2.1",
"object": "model",
"created": 1718134069,
"owned_by": "Sao10K",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 1.48,
"output": 1.48
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.92,
"throughput_tps": 37.01,
"performance_tested_at": "2025-08-04T09:06:20.488Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 11.41,
"throughput_tps": 2.45,
"performance_tested_at": "2025-08-04T09:06:30.977Z"
}
]
},
{
"id": "Qwen/QwQ-32B-Preview",
"object": "model",
"created": 1732722655,
"owned_by": "Qwen",
"providers": [
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 7.21,
"throughput_tps": 4.16,
"performance_tested_at": "2025-08-04T09:06:26.777Z"
},
{
"provider": "together",
"status": "live",
"supports_tools": true,
"supports_structured_output": true,
"pricing": {
"input": 65,
"output": 0
},
"context_length": 32768,
"supports_stop_sequences": true,
"latency_s": 2.93,
"throughput_tps": 97.22,
"performance_tested_at": "2025-08-04T09:06:22.501Z"
}
]
},
{
"id": "deepseek-ai/DeepSeek-Prover-V2-671B",
"object": "model",
"created": 1745993675,
"owned_by": "deepseek-ai",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 160000,
"pricing": {
"input": 0.7,
"output": 2.5
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 1.87,
"throughput_tps": 21.37,
"performance_tested_at": "2025-08-04T09:06:21.441Z"
}
]
},
{
"id": "marin-community/marin-8b-instruct",
"object": "model",
"created": 1747241066,
"owned_by": "marin-community",
"providers": [
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 7.63,
"throughput_tps": 3.67,
"performance_tested_at": "2025-08-04T09:06:27.201Z"
},
{
"provider": "together",
"status": "live",
"context_length": 4096,
"pricing": {
"input": 0.18000000000000002,
"output": 0.18000000000000002
},
"supports_tools": false,
"supports_structured_output": true,
"supports_stop_sequences": true,
"latency_s": 0.62,
"throughput_tps": 693.1,
"performance_tested_at": "2025-08-04T09:06:20.185Z"
}
]
},
{
"id": "SentientAGI/Dobby-Unhinged-Llama-3.3-70B",
"object": "model",
"created": 1739304442,
"owned_by": "SentientAGI",
"providers": [
{
"provider": "fireworks-ai",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"context_length": 163840,
"supports_image_input": false,
"supports_function_calling": false,
"latency_s": 1.03,
"throughput_tps": 72.04,
"performance_tested_at": "2025-08-04T09:06:20.597Z"
}
]
},
{
"id": "NousResearch/Hermes-3-Llama-3.1-405B",
"object": "model",
"created": 1723525073,
"owned_by": "NousResearch",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 1,
"output": 3
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 4.41,
"throughput_tps": 32.23,
"performance_tested_at": "2025-08-04T09:06:23.975Z"
}
]
},
{
"id": "alpindale/WizardLM-2-8x22B",
"object": "model",
"created": 1713235019,
"owned_by": "alpindale",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 65535,
"pricing": {
"input": 0.62,
"output": 0.62
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 4.41,
"throughput_tps": 23.38,
"performance_tested_at": "2025-08-04T09:06:23.975Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 4.02,
"throughput_tps": 11.94,
"performance_tested_at": "2025-08-04T09:06:23.589Z"
}
]
},
{
"id": "meta-llama/Llama-Guard-4-12B",
"object": "model",
"created": 1745407825,
"owned_by": "meta-llama",
"providers": [
{
"provider": "groq",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.2,
"output": 0.2
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 0.39,
"throughput_tps": 557.65,
"performance_tested_at": "2025-08-04T09:06:19.959Z"
}
]
},
{
"id": "Qwen/Qwen2.5-32B-Instruct",
"object": "model",
"created": 1726546675,
"owned_by": "Qwen",
"providers": [
{
"provider": "nebius",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.13,
"output": 0.4
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 0.37,
"throughput_tps": 150.33,
"performance_tested_at": "2025-08-04T09:06:41.063Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 7.41,
"throughput_tps": 3.92,
"performance_tested_at": "2025-08-04T09:06:48.097Z"
}
]
},
{
"id": "dphn/dolphin-2.9.2-mixtral-8x22b",
"object": "model",
"created": 1716934597,
"owned_by": "dphn",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 16000,
"pricing": {
"input": 0.9,
"output": 0.9
},
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 3.73,
"throughput_tps": 25.48,
"performance_tested_at": "2025-08-04T09:06:44.419Z"
}
]
},
{
"id": "Qwen/Qwen2-72B-Instruct",
"object": "model",
"created": 1716868129,
"owned_by": "Qwen",
"providers": [
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:07:10.691Z"
},
{
"provider": "together",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.9,
"output": 0.9
},
"supports_tools": false,
"supports_structured_output": false,
"supports_stop_sequences": true,
"latency_s": 0.68,
"throughput_tps": 64.82,
"performance_tested_at": "2025-08-04T09:06:41.369Z"
}
]
},
{
"id": "NousResearch/Hermes-3-Llama-3.1-70B",
"object": "model",
"created": 1722263277,
"owned_by": "NousResearch",
"providers": [
{
"provider": "featherless-ai",
"status": "offline",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"performance_error": "Request timeout",
"performance_tested_at": "2025-08-04T09:07:10.691Z"
},
{
"provider": "hyperbolic",
"status": "live",
"supports_tools": false,
"supports_structured_output": false,
"latency_s": 26.93,
"throughput_tps": 4.35,
"performance_tested_at": "2025-08-04T09:07:07.615Z"
}
]
},
{
"id": "Sao10K/L3-8B-Lunaris-v1",
"object": "model",
"created": 1719362412,
"owned_by": "Sao10K",
"providers": [
{
"provider": "novita",
"status": "live",
"context_length": 8192,
"pricing": {
"input": 0.05,
"output": 0.05
},
"supports_tools": false,
"supports_structured_output": false,
"supports_response_format": true,
"latency_s": 1.01,
"throughput_tps": 32.63,
"performance_tested_at": "2025-08-04T09:06:41.702Z"
},
{
"provider": "featherless-ai",
"status": "live",
"pricing": {
"input": 0.1,
"output": 0.1
},
"context_length": 16384,
"latency_s": 8.55,
"throughput_tps": 3.51,
"performance_tested_at": "2025-08-04T09:06:49.238Z"
}
]
},
{
"id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
"object": "model",
"created": 1728700633,
"owned_by": "nvidia",
"providers": [
{
"provider": "together",
"status": "live",
"context_length": 32768,
"pricing": {
"input": 0.88,
"output": 0.88
},
"supports_tools": true,
"supports_structured_output": false,
"supports_stop_sequences": true,
"latency_s": 1.43,
"throughput_tps": 74.25,
"performance_tested_at": "2025-08-04T09:06:42.118Z"
}
]
},
{
"id": "CohereLabs/c4ai-command-r-v01",
"object": "model",
"created": 1710172254,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.72,
"throughput_tps": 109.72,
"performance_tested_at": "2025-08-04T09:06:41.410Z"
}
]
},
{
"id": "tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4",
"object": "model",
"created": 1740976430,
"owned_by": "tokyotech-llm",
"providers": [
{
"provider": "sambanova",
"status": "live",
"context_length": 131072,
"pricing": {
"input": 0.6,
"output": 1.2
},
"supports_tools": false,
"supports_structured_output": true,
"latency_s": 2.99,
"throughput_tps": 11.36,
"performance_tested_at": "2025-08-04T09:06:43.683Z"
}
]
},
{
"id": "CohereLabs/c4ai-command-r-08-2024",
"object": "model",
"created": 1724053211,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.44,
"throughput_tps": 59.12,
"performance_tested_at": "2025-08-04T09:06:41.130Z"
}
]
},
{
"id": "CohereLabs/c4ai-command-r7b-12-2024",
"object": "model",
"created": 1733932505,
"owned_by": "CohereLabs",
"providers": [
{
"provider": "cohere",
"status": "live",
"supports_tools": true,
"supports_structured_output": false,
"latency_s": 0.32,
"throughput_tps": 77.16,
"performance_tested_at": "2025-08-04T09:06:41.014Z"
}
]
}
],
"generated_at": "2025-08-04T09:07:10.692Z",
"metadata": {
"total_models": 91,
"models_enriched": 75,
"providers_enriched": 145,
"performance_tested": true,
"providers_fetched": {
"novita": 52,
"sambanova": 10,
"groq": 21,
"featherless": 5748,
"together": 90,
"cohere": 0,
"fireworks": 32,
"nebius": 0,
"hyperbolic": 0,
"cerebras": 0,
"nscale": 0
}
}
}