{
"service": "InferenceLatency.com",
"endpoint": "/reliability-metrics",
"timestamp": "2026-05-31T02:49:35.296276Z",
"provider_reliability": {
"OpenAI": {
"current_performance": {
"latency_ms": 516,
"model": "GPT-4o",
"status": "operational"
},
"percentile_analysis": {
"p50": 459,
"p95": 2153,
"p99": 4957,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 75.0,
"requests_24h": 8,
"mean_time_to_respond": 1037.5
},
"quality_grade": "D"
},
"Groq": {
"current_performance": {
"latency_ms": 1387,
"model": "llama-3.1-8b-instant",
"status": "operational"
},
"percentile_analysis": {
"p50": 2167,
"p95": 17236,
"p99": 26443,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 62.5,
"requests_24h": 8,
"mean_time_to_respond": 4792.75
},
"quality_grade": "D"
},
"Claude": {
"current_performance": {
"latency_ms": 819,
"model": "Claude Sonnet 4",
"status": "operational"
},
"percentile_analysis": {
"p50": 1143,
"p95": 2574,
"p99": 4595,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 8,
"mean_time_to_respond": 909.5
},
"quality_grade": "A+"
}
},
"platform_summary": {
"overall_availability_percent": 100.0,
"overall_sla_compliance_percent": 79.17,
"total_providers_analyzed": 3,
"grade_distribution": {
"A+": 1,
"A": 0,
"B": 0,
"C": 0,
"D": 2
}
},
"sla_targets": {
"availability_target": "99.5%",
"latency_target": "95% of requests under 2000ms",
"error_rate_target": "< 0.5%"
},
"methodology": {
"data_window": "24 hours",
"percentile_calculations": "Based on last 100 successful requests",
"grading_criteria": "Industry-standard SLA benchmarks"
}
}