{
  "@context": "https://schema.org",
  "@type": "Dataset",
  "name": "LLM API Latency Benchmark - May 2026",
  "description": "P50, P95, P99, TTFT, and output speed measurements across OpenAI, Anthropic, Google, DeepSeek, OpenRouter, Groq, and Together AI models.",
  "temporalCoverage": "2026-05-01/2026-05-12",
  "generatedAt": "2026-05-12T14:00:00Z",
  "creator": "llmping",
  "methodologyUrl": "https://llmping.com/blog/measuring-llm-latency-correctly/",
  "sourceUrl": "https://llmping.com/leaderboard/",
  "rows": [
    {
      "provider": "OpenAI",
      "providerSlug": "openai",
      "model": "gpt-4o",
      "modelSlug": "gpt-4o",
      "region": "US East",
      "regionSlug": "us-east",
      "p50Ms": 342,
      "p95Ms": 891,
      "p99Ms": 1430,
      "ttftMs": 410,
      "tokensPerSecond": 72,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:55:00Z"
    },
    {
      "provider": "OpenAI",
      "providerSlug": "openai",
      "model": "gpt-4o-mini",
      "modelSlug": "gpt-4o-mini",
      "region": "US West",
      "regionSlug": "us-west",
      "p50Ms": 378,
      "p95Ms": 936,
      "p99Ms": 1518,
      "ttftMs": 442,
      "tokensPerSecond": 86,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:54:00Z"
    },
    {
      "provider": "Anthropic",
      "providerSlug": "anthropic",
      "model": "claude-3-5-sonnet",
      "modelSlug": "claude-3-5-sonnet",
      "region": "US East",
      "regionSlug": "us-east",
      "p50Ms": 416,
      "p95Ms": 1048,
      "p99Ms": 1640,
      "ttftMs": 492,
      "tokensPerSecond": 63,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:56:00Z"
    },
    {
      "provider": "Anthropic",
      "providerSlug": "anthropic",
      "model": "claude-3-haiku",
      "modelSlug": "claude-3-haiku",
      "region": "Europe",
      "regionSlug": "europe",
      "p50Ms": 536,
      "p95Ms": 1280,
      "p99Ms": 1984,
      "ttftMs": 610,
      "tokensPerSecond": 94,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:57:00Z"
    },
    {
      "provider": "Google",
      "providerSlug": "google",
      "model": "gemini-1.5-pro",
      "modelSlug": "gemini-1-5-pro",
      "region": "US East",
      "regionSlug": "us-east",
      "p50Ms": 458,
      "p95Ms": 1165,
      "p99Ms": 1880,
      "ttftMs": 535,
      "tokensPerSecond": 68,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:58:00Z"
    },
    {
      "provider": "Google",
      "providerSlug": "google",
      "model": "gemini-1.5-flash",
      "modelSlug": "gemini-1-5-flash",
      "region": "Asia Pacific",
      "regionSlug": "asia-pacific",
      "p50Ms": 624,
      "p95Ms": 1490,
      "p99Ms": 2240,
      "ttftMs": 705,
      "tokensPerSecond": 102,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:59:00Z"
    },
    {
      "provider": "DeepSeek",
      "providerSlug": "deepseek",
      "model": "deepseek-chat",
      "modelSlug": "deepseek-chat",
      "region": "Singapore",
      "regionSlug": "singapore",
      "p50Ms": 388,
      "p95Ms": 990,
      "p99Ms": 1570,
      "ttftMs": 456,
      "tokensPerSecond": 78,
      "samples": 1440,
      "collectedAt": "2026-05-12T14:00:00Z"
    },
    {
      "provider": "OpenRouter",
      "providerSlug": "openrouter",
      "model": "router-best",
      "modelSlug": "router-best",
      "region": "Japan",
      "regionSlug": "japan",
      "p50Ms": 710,
      "p95Ms": 1685,
      "p99Ms": 2520,
      "ttftMs": 804,
      "tokensPerSecond": 55,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:52:00Z"
    },
    {
      "provider": "Groq",
      "providerSlug": "groq",
      "model": "llama-3.3-70b",
      "modelSlug": "llama-3-3-70b",
      "region": "US East",
      "regionSlug": "us-east",
      "p50Ms": 302,
      "p95Ms": 770,
      "p99Ms": 1220,
      "ttftMs": 360,
      "tokensPerSecond": 186,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:53:00Z"
    },
    {
      "provider": "Together AI",
      "providerSlug": "together",
      "model": "mixtral-8x7b",
      "modelSlug": "mixtral-8x7b",
      "region": "US West",
      "regionSlug": "us-west",
      "p50Ms": 430,
      "p95Ms": 1108,
      "p99Ms": 1710,
      "ttftMs": 511,
      "tokensPerSecond": 112,
      "samples": 1440,
      "collectedAt": "2026-05-12T13:51:00Z"
    }
  ]
}