💰 Cost Optimization Analysis

← Back to Home

💰 Most cost-efficient: Fireworks AI | 📊 7 providers analyzed
Full JSON Response (for developers & agents)
{
  "service": "InferenceLatency.com",
  "endpoint": "cost-optimizer",
  "description": "AI provider cost optimization intelligence",
  "cost_analysis": {
    "most_cost_efficient": {
      "provider": "Fireworks AI",
      "latency_ms": 349,
      "cost_per_1k_tokens_usd": 0.0002,
      "performance_score": 2.87,
      "cost_efficiency_score": 14326.65
    },
    "budget_recommendations": {
      "under_1_cent_per_1k": [
        {
          "provider": "Fireworks AI",
          "latency_ms": 349,
          "cost_per_1k_tokens_usd": 0.0002,
          "performance_score": 2.87,
          "cost_efficiency_score": 14326.65
        },
        {
          "provider": "Together AI",
          "latency_ms": 436,
          "cost_per_1k_tokens_usd": 0.0002,
          "performance_score": 2.29,
          "cost_efficiency_score": 11467.89
        },
        {
          "provider": "OpenRouter",
          "latency_ms": 1062,
          "cost_per_1k_tokens_usd": 0.00018,
          "performance_score": 0.94,
          "cost_efficiency_score": 5231.22
        },
        {
          "provider": "HF GPT OSS 120B (Cerebras)",
          "latency_ms": 289,
          "cost_per_1k_tokens_usd": 0.0008,
          "performance_score": 3.46,
          "cost_efficiency_score": 4325.26
        },
        {
          "provider": "Google Gemini",
          "latency_ms": 435,
          "cost_per_1k_tokens_usd": 0.00075,
          "performance_score": 2.3,
          "cost_efficiency_score": 3065.13
        },
        {
          "provider": "OpenAI",
          "latency_ms": 796,
          "cost_per_1k_tokens_usd": 0.0025,
          "performance_score": 1.26,
          "cost_efficiency_score": 502.51
        },
        {
          "provider": "Claude",
          "latency_ms": 2298,
          "cost_per_1k_tokens_usd": 0.003,
          "performance_score": 0.44,
          "cost_efficiency_score": 145.05
        }
      ],
      "premium_performance": [
        {
          "provider": "HF GPT OSS 120B (Cerebras)",
          "latency_ms": 289,
          "cost_per_1k_tokens_usd": 0.0008,
          "performance_score": 3.46,
          "cost_efficiency_score": 4325.26
        }
      ],
      "balanced_options": []
    },
    "savings_analysis": [
      {
        "provider": "Fireworks AI",
        "latency_ms": 349,
        "cost_per_1k_tokens_usd": 0.0002,
        "performance_score": 2.87,
        "cost_efficiency_score": 14326.65
      },
      {
        "provider": "Together AI",
        "latency_ms": 436,
        "cost_per_1k_tokens_usd": 0.0002,
        "performance_score": 2.29,
        "cost_efficiency_score": 11467.89
      },
      {
        "provider": "OpenRouter",
        "latency_ms": 1062,
        "cost_per_1k_tokens_usd": 0.00018,
        "performance_score": 0.94,
        "cost_efficiency_score": 5231.22
      },
      {
        "provider": "HF GPT OSS 120B (Cerebras)",
        "latency_ms": 289,
        "cost_per_1k_tokens_usd": 0.0008,
        "performance_score": 3.46,
        "cost_efficiency_score": 4325.26
      },
      {
        "provider": "Google Gemini",
        "latency_ms": 435,
        "cost_per_1k_tokens_usd": 0.00075,
        "performance_score": 2.3,
        "cost_efficiency_score": 3065.13
      },
      {
        "provider": "OpenAI",
        "latency_ms": 796,
        "cost_per_1k_tokens_usd": 0.0025,
        "performance_score": 1.26,
        "cost_efficiency_score": 502.51
      },
      {
        "provider": "Claude",
        "latency_ms": 2298,
        "cost_per_1k_tokens_usd": 0.003,
        "performance_score": 0.44,
        "cost_efficiency_score": 145.05
      }
    ]
  },
  "optimization_guidance": {
    "cost_conscious": "Choose providers with highest cost_efficiency_score",
    "performance_critical": "Choose providers with lowest latency_ms",
    "balanced_approach": "Consider balanced_options for optimal cost-performance ratio"
  },
  "providers_tested": 7,
  "timestamp": "2025-09-07T23:19:23.005070Z"
}