📊 Reliability Metrics Analysis

← Back to Home

🔧 Reliability Analysis: 5 providers | 📊 Availability: 100.0% | ✅ SLA compliance: 90.77%
Full JSON Response (for developers & agents)
{
  "service": "InferenceLatency.com",
  "endpoint": "/reliability-metrics",
  "timestamp": "2026-01-15T05:07:47.241494Z",
  "provider_reliability": {
    "OpenAI": {
      "current_performance": {
        "latency_ms": 363,
        "model": "GPT-4o",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 430,
        "p95": 1226,
        "p99": 4957,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 92.31,
        "requests_24h": 13,
        "mean_time_to_respond": 659.46
      },
      "quality_grade": "B"
    },
    "Groq": {
      "current_performance": {
        "latency_ms": 1752,
        "model": "llama-3.1-8b-instant",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 2117,
        "p95": 17236,
        "p99": 26443,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 92.31,
        "requests_24h": 13,
        "mean_time_to_respond": 1564.69
      },
      "quality_grade": "B"
    },
    "Claude": {
      "current_performance": {
        "latency_ms": 1576,
        "model": "Claude Sonnet 4",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 1194,
        "p95": 2464,
        "p99": 4595,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 92.31,
        "requests_24h": 13,
        "mean_time_to_respond": 1617.0
      },
      "quality_grade": "B"
    },
    "OpenRouter": {
      "current_performance": {
        "latency_ms": 286,
        "model": "Mistral",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 1074,
        "p95": 16538,
        "p99": 24985,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 84.62,
        "requests_24h": 13,
        "mean_time_to_respond": 1140.92
      },
      "quality_grade": "C"
    },
    "Together AI": {
      "current_performance": {
        "latency_ms": 466,
        "model": "Llama3.1-8B-Turbo",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 474,
        "p95": 20439,
        "p99": 32963,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 92.31,
        "requests_24h": 13,
        "mean_time_to_respond": 485.08
      },
      "quality_grade": "B"
    }
  },
  "platform_summary": {
    "overall_availability_percent": 100.0,
    "overall_sla_compliance_percent": 90.77,
    "total_providers_analyzed": 5,
    "grade_distribution": {
      "A+": 0,
      "A": 0,
      "B": 4,
      "C": 1,
      "D": 0
    }
  },
  "sla_targets": {
    "availability_target": "99.5%",
    "latency_target": "95% of requests under 2000ms",
    "error_rate_target": "< 0.5%"
  },
  "methodology": {
    "data_window": "24 hours",
    "percentile_calculations": "Based on last 100 successful requests",
    "grading_criteria": "Industry-standard SLA benchmarks"
  }
}