{
"service": "InferenceLatency.com",
"endpoint": "/reliability-metrics",
"timestamp": "2026-04-16T01:10:06.391383Z",
"provider_reliability": {
"OpenAI": {
"current_performance": {
"latency_ms": 402,
"model": "GPT-4o",
"status": "operational"
},
"percentile_analysis": {
"p50": 455,
"p95": 1226,
"p99": 4957,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 10,
"mean_time_to_respond": 526.7
},
"quality_grade": "A+"
},
"Groq": {
"current_performance": {
"latency_ms": 1506,
"model": "llama-3.1-8b-instant",
"status": "operational"
},
"percentile_analysis": {
"p50": 2081,
"p95": 17236,
"p99": 26443,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 10,
"mean_time_to_respond": 1016.0
},
"quality_grade": "A+"
},
"Claude": {
"current_performance": {
"latency_ms": 1244,
"model": "Claude Sonnet 4",
"status": "operational"
},
"percentile_analysis": {
"p50": 1143,
"p95": 2444,
"p99": 4595,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 10,
"mean_time_to_respond": 1107.3
},
"quality_grade": "A+"
},
"OpenRouter": {
"current_performance": {
"latency_ms": 398,
"model": "Mistral",
"status": "operational"
},
"percentile_analysis": {
"p50": 1019,
"p95": 16538,
"p99": 24985,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 10,
"mean_time_to_respond": 309.1
},
"quality_grade": "A+"
}
},
"platform_summary": {
"overall_availability_percent": 100.0,
"overall_sla_compliance_percent": 100.0,
"total_providers_analyzed": 4,
"grade_distribution": {
"A+": 4,
"A": 0,
"B": 0,
"C": 0,
"D": 0
}
},
"sla_targets": {
"availability_target": "99.5%",
"latency_target": "95% of requests under 2000ms",
"error_rate_target": "< 0.5%"
},
"methodology": {
"data_window": "24 hours",
"percentile_calculations": "Based on last 100 successful requests",
"grading_criteria": "Industry-standard SLA benchmarks"
}
}