<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <!-- Auto-generated by scripts/generate-sitemap.mjs — do not edit manually -->

  <!-- Static pages -->
  <url><loc>https://inferencebench.io/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>1.0</priority></url>
  <url><loc>https://inferencebench.io/leaderboard/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/models/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/calculator/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/gpus/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/providers/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/compare/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/use-case/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/calculator/training/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/workload-matcher/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/leaderboard/training/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/community/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/methodology/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/developers/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/glossary/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/support/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/api/v2/docs/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/use-case/chatbot/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/code-generation/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/document-analysis/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/real-time-translation/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/content-generation/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/runpod-vs-lambda/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/aws-vs-gcp/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/together-ai-vs-fireworks/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/deepseek-r1-vs-deepseek-v3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-a100-80gb-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h200-sxm-vs-nvidia-h100-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-h100-pcie/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-a100-40gb-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-4090-vs-nvidia-l40s/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-b200-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-l40s/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-3090-vs-nvidia-rtx-4090/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-nvl-vs-nvidia-h100-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-b200-sxm-vs-nvidia-h200-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-b200-sxm-vs-nvidia-b100-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h200-sxm-vs-nvidia-a100-80gb-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-l40s/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-l40s-vs-nvidia-l40/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-a100-80gb-pcie/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-4090-vs-nvidia-rtx-5090/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-amd-mi300x/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-amd-mi300x/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-l4-vs-nvidia-t4/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a6000-vs-nvidia-l40s/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-1.5-34b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-1.5-9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-coder-9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-large/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-lightning/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ai21/jamba-1.5-large/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ai21/jamba-1.5-mini/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/gte-qwen2-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/marco-o1/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-1.5-moe-a2.7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2-audio-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-14b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-32b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-coder-32b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/olmo-2-13b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/olmo-2-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/amazon/nova-lite/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/amazon/nova-pro/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/apple/openelm-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/arabic/jais-30b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-base-en-v1.5/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-large-en-v1.5/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-m3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigscience/bloom-176b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigscience/bloom-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bytedance/doubao-pro-32b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bytedance/doubao-pro-4b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cerebras/btlm-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cerebras/cerebras-gpt-13b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-plus/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/embed-english-v3.0/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/rerank-english-v3.0/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/databricks/dbrx-132b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-v2-236b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-llama-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-qwen-32b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/eleutherai/gpt-j-6b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/eleutherai/gpt-neox-20b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/eleutherai/pythia-12b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/eleutherai/pythia-6.9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/flan-t5-xxl-11b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemini-1.5-flash/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemini-1.5-pro/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemini-2.0-flash/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemini-2.5-pro/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-27b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-2b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-12b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-1b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-27b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-4b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-4-12b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-4-27b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-4-31b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-4-5b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/palm-2-340b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/recurrentgemma-9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/t5-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm-135m/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm-360m/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm2-1.7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/starcoder2-15b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/starcoder2-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/starcoder2-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ibm/granite-20b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ibm/granite-3.0-8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ibm/granite-34b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/inflection/inflection-2.5-40b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/intel/neural-chat-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/jina/jina-embeddings-v2/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/jina/jina-embeddings-v3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/jina/jina-reranker-v2-turbo/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/kaist/prometheus-2-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/codellama-34b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/codellama-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/codellama-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-2-13b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-2-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-2-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3-8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.1-405b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.1-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.1-8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.2-11b-vision/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.2-1b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.2-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.2-90b-vision/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-3.3-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-4-maverick-400b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/llama-4-scout-109b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/biogpt-1.5b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-1.5-1.3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-2-2.7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-medium-14b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-mini-3.8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-small-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3.5-mini-3.8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3.5-moe-42b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-14b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-mini-3.8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-multimodal-5.6b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-reasoning-14b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-reasoning-plus-14b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/wizardlm-2-8x22b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-m1-40b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-m1-80b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-m25-229b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-m27-456b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/codestral-22b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mistral-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mistral-large-2-123b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mistral-medium-3-25b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mistral-nemo-12b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mistral-small-3-24b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mistral-small-3.1-24b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mixtral-8x22b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/mixtral-8x7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistralai/pixtral-12b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mosaic/mpt-30b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mosaic/mpt-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/naver/hyperclova-x-82b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/naver/hyperclova2-128b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nexusflow/starling-lm-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nous/hermes-2-34b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/alpamayo-1.5-10b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/cosmos-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-70b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-4-15b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-4-340b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-h-56b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nvlm-72b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/chatgpt-4o-latest/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-3.5-turbo/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-4-turbo/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-4.1/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-4.1-mini/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-4.1-nano/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-4o/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-4o-mini/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o1/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o1-mini/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o1-pro/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o3-mini/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o3-pro/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/o4-mini/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/text-embedding-3-large/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/text-embedding-3-small/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-large-v3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openbmb/minicpm-2b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openbmb/minicpm-v-2.6-8b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/reka/reka-core-67b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/reka/reka-flash-21b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rwkv/rwkv-5-14b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rwkv/rwkv-6-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rwkv/rwkv-7-2.9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/salesforce/codegen2-16b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sberbank/gigachat-20b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/scientific/sciglm-6b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sensetime/internlm-20b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sentence-transformers/all-minilm-l6-v2/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/snowflake/arctic-128x3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/snowflake/arctic-480b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/sdxl-1.0/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/stablelm-2-12b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/stablelm-zephyr-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/teknium/openhermes-2.5-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/thudm/chatglm3-6b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/thudm/cogvlm2-19b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-11b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-10b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-1b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-3b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-mamba-7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tinyllama/tinyllama-1.1b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tinyllama/tinyllama-1.1b-chat/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/together/llama-3.1-70b-turbo/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/upstage/solar-10.7b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/upstage/solar-pro-22b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/wizardlm/wizardcoder-33b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-2/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/yandex/yalm-100b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/yilai/yi-6b-200k/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/chatglm4-9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/glm-4-9b/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/glm-5/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi100/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi210/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi250x/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi300x/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi325x/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-rx-7900-xtx/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-w7900/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/aws-trainium2/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v4/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v5e/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v6e/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/groq-lpu/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-2/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-3/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-3-hl325l/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-40gb-pcie/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-40gb-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-80gb-pcie/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-80gb-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a10g/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a16/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a2/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a30/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a40/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a4000/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a6000/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b100-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b200-nvl/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b200-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b300/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gb200-nvl72/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gb300-nvl72/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gh200/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-nvl/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-nvl-94gb/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-pcie/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h20/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h200-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l20/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l4/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l40/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l40s/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3060/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3070/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3080/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3090/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4060/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4060-ti-16gb/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4070-super/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4070-ti/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4080/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4090/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-5090/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-6000-ada/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-a5000/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-t4/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-v100-16gb/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-v100-32gb/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/qualcomm-cloud-ai-100/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/providers/aws/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/azure/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/coreweave/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepinfra/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepseek/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fireworks/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fluidstack/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gcp/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/groq/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/huggingface/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/hyperbolic/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/lambda/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/novita/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/replicate/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/runpod/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/sambanova/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/tensordock/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/together-ai/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/vast-ai/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/sustainability/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/ixps/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/leaderboard/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/united-states/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/united-kingdom/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/germany/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/japan/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/singapore/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/australia/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/france/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/netherlands/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/canada/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/india/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/brazil/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/south-korea/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/ireland/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/sweden/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/norway/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/china/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/hong-kong/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/taiwan/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/finland/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/switzerland/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/h100-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/a100-80gb-sxm/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/h200/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/l40s/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/rtx-4090/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/a6000/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/l4/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/rtx-3090/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/b200/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/rtx-5090/</loc><lastmod>2026-04-12</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/privacy/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/terms/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/cookies/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.2</priority></url>
  <url><loc>https://inferencebench.io/compliance/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/safety/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/licenses/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.2</priority></url>

  <!-- Blog pages (auto-discovered) -->
  <url><loc>https://inferencebench.io/blog/</loc><lastmod>2026-04-12</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/blog/gemma-4-vs-moe-dense-model-wins/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/gpu-memory-wall-forecasting-ai-demand-2028/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/minimax-m25-229b-moe-honest-benchmark/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/minimax-m25-vs-m27-doubling-moe-params/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/minimax-m27-456b-bigger-moe-paradox/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/nvidia-rubin-vera-next-gpu-revolution/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/benchmarking-nvidia-alpamayo-1-5-10b-h100/</loc><lastmod>2026-04-09</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/gemma-4-31b-h100-complete-inference-benchmark/</loc><lastmod>2026-04-09</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
</urlset>
