📊 Reliability Metrics Analysis

← Back to Home

🔧 Reliability Analysis: 5 providers | 📊 Availability: 97.14% | ✅ SLA compliance: 97.14%
Full JSON Response (for developers & agents)
{
  "service": "InferenceLatency.com",
  "endpoint": "/reliability-metrics",
  "timestamp": "2026-03-01T22:50:46.126196Z",
  "provider_reliability": {
    "OpenAI": {
      "current_performance": {
        "latency_ms": 614,
        "model": "GPT-4o",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 467,
        "p95": 1226,
        "p99": 4957,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 100.0,
        "requests_24h": 7,
        "mean_time_to_respond": 879.0
      },
      "quality_grade": "A+"
    },
    "Groq": {
      "current_performance": {
        "latency_ms": 1197,
        "model": "llama-3.1-8b-instant",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 2117,
        "p95": 17236,
        "p99": 26443,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 100.0,
        "requests_24h": 7,
        "mean_time_to_respond": 1214.57
      },
      "quality_grade": "A+"
    },
    "Claude": {
      "current_performance": {
        "latency_ms": 1011,
        "model": "Claude Sonnet 4",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 1143,
        "p95": 2444,
        "p99": 4595,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 100.0,
        "requests_24h": 7,
        "mean_time_to_respond": 1026.29
      },
      "quality_grade": "A+"
    },
    "OpenRouter": {
      "current_performance": {
        "latency_ms": 419,
        "model": "Mistral",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 1019,
        "p95": 16538,
        "p99": 24985,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 100.0,
        "error_rate_percent": 0.0,
        "sla_compliance_percent": 100.0,
        "requests_24h": 7,
        "mean_time_to_respond": 526.43
      },
      "quality_grade": "A+"
    },
    "Together AI": {
      "current_performance": {
        "latency_ms": 217,
        "model": "Llama3.1-8B-Turbo",
        "status": "operational"
      },
      "percentile_analysis": {
        "p50": 406,
        "p95": 20439,
        "p99": 32963,
        "sample_size": 100
      },
      "reliability_metrics": {
        "availability_percent": 85.71,
        "error_rate_percent": 14.29,
        "sla_compliance_percent": 85.71,
        "requests_24h": 7,
        "mean_time_to_respond": 244.83
      },
      "quality_grade": "D"
    }
  },
  "platform_summary": {
    "overall_availability_percent": 97.14,
    "overall_sla_compliance_percent": 97.14,
    "total_providers_analyzed": 5,
    "grade_distribution": {
      "A+": 4,
      "A": 0,
      "B": 0,
      "C": 0,
      "D": 1
    }
  },
  "sla_targets": {
    "availability_target": "99.5%",
    "latency_target": "95% of requests under 2000ms",
    "error_rate_target": "< 0.5%"
  },
  "methodology": {
    "data_window": "24 hours",
    "percentile_calculations": "Based on last 100 successful requests",
    "grading_criteria": "Industry-standard SLA benchmarks"
  }
}