{
"service": "InferenceLatency.com",
"endpoint": "/reliability-metrics",
"timestamp": "2025-10-26T06:22:53.348098Z",
"provider_reliability": {
"OpenAI": {
"current_performance": {
"latency_ms": 1091,
"model": "GPT-4o",
"status": "operational"
},
"percentile_analysis": {
"p50": 466,
"p95": 1345,
"p99": 4957,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 88.89,
"requests_24h": 9,
"mean_time_to_respond": 850.67
},
"quality_grade": "C"
},
"Groq": {
"current_performance": {
"latency_ms": 2063,
"model": "llama-3.1-8b-instant",
"status": "operational"
},
"percentile_analysis": {
"p50": 2146,
"p95": 17236,
"p99": 26443,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 44.44,
"requests_24h": 9,
"mean_time_to_respond": 1608.11
},
"quality_grade": "D"
},
"Claude": {
"current_performance": {
"latency_ms": 1539,
"model": "Claude Sonnet 4",
"status": "operational"
},
"percentile_analysis": {
"p50": 1172,
"p95": 2444,
"p99": 4595,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 9,
"mean_time_to_respond": 1664.89
},
"quality_grade": "A+"
},
"OpenRouter": {
"current_performance": {
"latency_ms": 683,
"model": "Mistral",
"status": "operational"
},
"percentile_analysis": {
"p50": 1019,
"p95": 16538,
"p99": 24985,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 9,
"mean_time_to_respond": 682.0
},
"quality_grade": "A+"
},
"Google Gemini": {
"current_performance": {
"latency_ms": 351,
"model": "Gemini-2.0-Flash",
"status": "operational"
},
"percentile_analysis": {
"p50": 366,
"p95": 646,
"p99": 956,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 9,
"mean_time_to_respond": 346.0
},
"quality_grade": "A+"
},
"Together AI": {
"current_performance": {
"latency_ms": 189,
"model": "Llama3.1-8B-Turbo",
"status": "operational"
},
"percentile_analysis": {
"p50": 523,
"p95": 20439,
"p99": 32963,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 77.78,
"requests_24h": 9,
"mean_time_to_respond": 1423.11
},
"quality_grade": "D"
},
"Fireworks AI": {
"current_performance": {
"latency_ms": 222,
"model": "Llama3.1-8B",
"status": "operational"
},
"percentile_analysis": {
"p50": 477,
"p95": 20506,
"p99": 32993,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 9,
"mean_time_to_respond": 248.33
},
"quality_grade": "A+"
}
},
"platform_summary": {
"overall_availability_percent": 100.0,
"overall_sla_compliance_percent": 87.3,
"total_providers_analyzed": 7,
"grade_distribution": {
"A+": 4,
"A": 0,
"B": 0,
"C": 1,
"D": 2
}
},
"sla_targets": {
"availability_target": "99.5%",
"latency_target": "95% of requests under 2000ms",
"error_rate_target": "< 0.5%"
},
"methodology": {
"data_window": "24 hours",
"percentile_calculations": "Based on last 100 successful requests",
"grading_criteria": "Industry-standard SLA benchmarks"
}
}