{
"service": "InferenceLatency.com",
"endpoint": "/reliability-metrics",
"timestamp": "2026-01-15T05:07:47.241494Z",
"provider_reliability": {
"OpenAI": {
"current_performance": {
"latency_ms": 363,
"model": "GPT-4o",
"status": "operational"
},
"percentile_analysis": {
"p50": 430,
"p95": 1226,
"p99": 4957,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 92.31,
"requests_24h": 13,
"mean_time_to_respond": 659.46
},
"quality_grade": "B"
},
"Groq": {
"current_performance": {
"latency_ms": 1752,
"model": "llama-3.1-8b-instant",
"status": "operational"
},
"percentile_analysis": {
"p50": 2117,
"p95": 17236,
"p99": 26443,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 92.31,
"requests_24h": 13,
"mean_time_to_respond": 1564.69
},
"quality_grade": "B"
},
"Claude": {
"current_performance": {
"latency_ms": 1576,
"model": "Claude Sonnet 4",
"status": "operational"
},
"percentile_analysis": {
"p50": 1194,
"p95": 2464,
"p99": 4595,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 92.31,
"requests_24h": 13,
"mean_time_to_respond": 1617.0
},
"quality_grade": "B"
},
"OpenRouter": {
"current_performance": {
"latency_ms": 286,
"model": "Mistral",
"status": "operational"
},
"percentile_analysis": {
"p50": 1074,
"p95": 16538,
"p99": 24985,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 84.62,
"requests_24h": 13,
"mean_time_to_respond": 1140.92
},
"quality_grade": "C"
},
"Together AI": {
"current_performance": {
"latency_ms": 466,
"model": "Llama3.1-8B-Turbo",
"status": "operational"
},
"percentile_analysis": {
"p50": 474,
"p95": 20439,
"p99": 32963,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 92.31,
"requests_24h": 13,
"mean_time_to_respond": 485.08
},
"quality_grade": "B"
}
},
"platform_summary": {
"overall_availability_percent": 100.0,
"overall_sla_compliance_percent": 90.77,
"total_providers_analyzed": 5,
"grade_distribution": {
"A+": 0,
"A": 0,
"B": 4,
"C": 1,
"D": 0
}
},
"sla_targets": {
"availability_target": "99.5%",
"latency_target": "95% of requests under 2000ms",
"error_rate_target": "< 0.5%"
},
"methodology": {
"data_window": "24 hours",
"percentile_calculations": "Based on last 100 successful requests",
"grading_criteria": "Industry-standard SLA benchmarks"
}
}