🏋️ InferBench 🏋️

A cost/quality/speed Leaderboard for Inference Providers!

{
  • "headers": [
    • "Model",
    • "Median Inference Time",
    • "Price per Image",
    • "GenEval",
    • "HPS (v2.1)",
    • "GenAI-Bench (VQA)",
    • "DrawBench (Image Reward)",
    • "PartiPrompts (ARNIQA)",
    • "PartiPrompts (ClipIQA)",
    • "PartiPrompts (ClipScore)",
    • "PartiPrompts (Sharpness - Laplacian Variance)"
    ],
  • "data": [
    • [
      • "<a target="_blank" href="https://replicate.com/prunaai/flux.1-juiced" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">Pruna [extra juiced]</a>",
      • 2.6,
      • 0.004,
      • 69.9,
      • 29.86,
      • 0.7466,
      • 0.9458,
      • 0.6591,
      • 0.8887,
      • 27.6,
      • 7997
      ],
    • [
      • "<a target="_blank" href="https://replicate.com/prunaai/flux.1-lightly-juiced" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">Pruna [lightly juiced]</a>",
      • 3.57,
      • 0.0054,
      • 69.12,
      • 30.36,
      • 0.7405,
      • 0.9972,
      • 0.6789,
      • 0.9031,
      • 27.56,
      • 7849
      ],
    • [
      • "<a target="_blank" href="https://fal.ai/models/fal-ai/flux/dev" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">fal</a>",
      • 4.06,
      • 0.025,
      • 68.72,
      • 29.97,
      • 0.7441,
      • 1.0084,
      • 0.6702,
      • 0.8967,
      • 27.61,
      • 7295
      ],
    • [
      • "<a target="_blank" href="https://replicate.com/prunaai/flux.1-juiced" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">Pruna [juiced]</a>",
      • 3.14,
      • 0.0048,
      • 68.64,
      • 30.38,
      • 0.7408,
      • 0.9657,
      • 0.6762,
      • 0.9014,
      • 27.55,
      • 7627
      ],
    • [
      • "<a target="_blank" href="https://huggingface.co/black-forest-labs/FLUX.1-dev?library=diffusers" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">Baseline [Nvidia H100]</a>",
      • 6.88,
      • 0.025,
      • 67.98,
      • 30.36,
      • 0.74,
      • 1.0072,
      • 0.6758,
      • 0.8968,
      • 27.4,
      • 6833
      ],
    • [
      • "<a target="_blank" href="https://replicate.com/black-forest-labs/flux-dev" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">Replicate [go_fast]</a>",
      • 3.38,
      • 0.025,
      • 67.41,
      • 29.25,
      • 0.7547,
      • 0.9282,
      • 0.6356,
      • 0.8609,
      • 27.56,
      • 4872
      ],
    • [
      • "<a target="_blank" href="https://fireworks.ai/models/fireworks/flux-1-dev-fp8" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">fireworks [fp8]</a>",
      • 4.66,
      • 0.014,
      • 65.55,
      • 30.26,
      • 0.7455,
      • 0.9467,
      • 0.6639,
      • 0.8478,
      • 27.24,
      • 5625
      ],
    • [
      • "<a target="_blank" href="https://www.together.ai/models/flux-1-dev" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">Together AI</a>",
      • 3.38,
      • 0.025,
      • 64.61,
      • 30.22,
      • 0.7339,
      • 0.9463,
      • 0.5752,
      • 0.8709,
      • 27.31,
      • 4501
      ]
    ],
  • "metadata": null
}
Twitter GitHub LinkedIn Discord Reddit
@misc{InferBench,
    title={InferBench: A Leaderboard for Inference Providers},
    author={PrunaAI},
    year={2025},
    howpublished={\url{https://huggingface.co/spaces/PrunaAI/InferBench}}
}