{
"service": "InferenceLatency.com",
"endpoint": "/reliability-metrics",
"timestamp": "2026-03-01T22:50:46.126196Z",
"provider_reliability": {
"OpenAI": {
"current_performance": {
"latency_ms": 614,
"model": "GPT-4o",
"status": "operational"
},
"percentile_analysis": {
"p50": 467,
"p95": 1226,
"p99": 4957,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 7,
"mean_time_to_respond": 879.0
},
"quality_grade": "A+"
},
"Groq": {
"current_performance": {
"latency_ms": 1197,
"model": "llama-3.1-8b-instant",
"status": "operational"
},
"percentile_analysis": {
"p50": 2117,
"p95": 17236,
"p99": 26443,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 7,
"mean_time_to_respond": 1214.57
},
"quality_grade": "A+"
},
"Claude": {
"current_performance": {
"latency_ms": 1011,
"model": "Claude Sonnet 4",
"status": "operational"
},
"percentile_analysis": {
"p50": 1143,
"p95": 2444,
"p99": 4595,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 7,
"mean_time_to_respond": 1026.29
},
"quality_grade": "A+"
},
"OpenRouter": {
"current_performance": {
"latency_ms": 419,
"model": "Mistral",
"status": "operational"
},
"percentile_analysis": {
"p50": 1019,
"p95": 16538,
"p99": 24985,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 100.0,
"error_rate_percent": 0.0,
"sla_compliance_percent": 100.0,
"requests_24h": 7,
"mean_time_to_respond": 526.43
},
"quality_grade": "A+"
},
"Together AI": {
"current_performance": {
"latency_ms": 217,
"model": "Llama3.1-8B-Turbo",
"status": "operational"
},
"percentile_analysis": {
"p50": 406,
"p95": 20439,
"p99": 32963,
"sample_size": 100
},
"reliability_metrics": {
"availability_percent": 85.71,
"error_rate_percent": 14.29,
"sla_compliance_percent": 85.71,
"requests_24h": 7,
"mean_time_to_respond": 244.83
},
"quality_grade": "D"
}
},
"platform_summary": {
"overall_availability_percent": 97.14,
"overall_sla_compliance_percent": 97.14,
"total_providers_analyzed": 5,
"grade_distribution": {
"A+": 4,
"A": 0,
"B": 0,
"C": 0,
"D": 1
}
},
"sla_targets": {
"availability_target": "99.5%",
"latency_target": "95% of requests under 2000ms",
"error_rate_target": "< 0.5%"
},
"methodology": {
"data_window": "24 hours",
"percentile_calculations": "Based on last 100 successful requests",
"grading_criteria": "Industry-standard SLA benchmarks"
}
}