<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <!-- Static pages: public, indexable landing, tool, documentation and legal pages.
       Only URLs intended for search indexing belong here. Non-public routes such as
       /admin/ are deliberately not listed, because advertising them to crawlers
       yields crawl errors and exposes back-office endpoints. -->
  <url><loc>https://inferencebench.io/</loc><lastmod>2026-04-01</lastmod><changefreq>daily</changefreq><priority>1.0</priority></url>
  <url><loc>https://inferencebench.io/leaderboard/</loc><lastmod>2026-04-01</lastmod><changefreq>daily</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/models/</loc><lastmod>2026-04-01</lastmod><changefreq>daily</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/gpus/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/providers/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/calculator/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/calculator/training/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/leaderboard/training/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/community/</loc><lastmod>2026-04-01</lastmod><changefreq>daily</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/support/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/glossary/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/training/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/training/compare/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/training/methods/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/training/guide/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/privacy/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/terms/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/cookies/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.2</priority></url>
  <url><loc>https://inferencebench.io/compliance/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/safety/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/licenses/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.2</priority></url>
  <url><loc>https://inferencebench.io/api/v2/docs/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/methodology/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/developers/</loc><lastmod>2026-04-01</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/use-case/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/use-case/chatbot/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/code-generation/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/document-analysis/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/real-time-translation/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/content-generation/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/runpod-vs-lambda/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/aws-vs-gcp/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/together-ai-vs-fireworks/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/deepseek-r1-vs-deepseek-v3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>

  <!-- GPU comparison pages: head-to-head pages under /gpus/compare/, one entry per
       pair, with the path segment written as {gpu-a}-vs-{gpu-b}. Every entry in
       this section carries lastmod 2026-04-02, changefreq weekly and priority 0.7. -->
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-a100-80gb-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h200-sxm-vs-nvidia-h100-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-h100-pcie/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-a100-40gb-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-4090-vs-nvidia-l40s/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-b200-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-l40s/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-3090-vs-nvidia-rtx-4090/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-nvl-vs-nvidia-h100-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-b200-sxm-vs-nvidia-h200-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-b200-sxm-vs-nvidia-b100-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h200-sxm-vs-nvidia-a100-80gb-sxm/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-l40s/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-l40s-vs-nvidia-l40/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-a100-80gb-pcie/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-4090-vs-nvidia-rtx-5090/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-amd-mi300x/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-amd-mi300x/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-l4-vs-nvidia-t4/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a6000-vs-nvidia-l40s/</loc><lastmod>2026-04-02</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>

  <!-- Model pages (262 models) -->
  <url><loc>https://inferencebench.io/models/01-ai/yi-1.5-34b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-1.5-9b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-coder-9b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-lightning/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ai21/jamba-1.5-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ai21/jamba-1.5-mini/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/gte-qwen2-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/marco-o1/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-1.5-moe-a2.7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2-audio-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-14b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-32b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-coder-32b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/olmo-2-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/olmo-2-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/amazon/nova-lite/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/amazon/nova-pro/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/apple/openelm-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/arabic/jais-30b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-base-en-v1.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-large-en-v1.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-m3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-small-en-v1.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baichuan/baichuan2-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baichuan/baichuan2-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/octocoder-15b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/santacoder-1.1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/starcoder2-15b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/starcoder2-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/starcoder2-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/black-forest-labs/flux-1-dev/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cerebras/btlm-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cerebras/cerebras-gpt-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/codellama/codellama-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cognitivecomputations/dolphin-2.9-72b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/aya-23-35b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/aya-23-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-08-2024/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-plus/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/embed-english-v3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/databricks/dbrx-base/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/dbrx/dbrx-instruct/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-33b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-6.7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-v2-236b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-llm-67b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-math-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-moe-16b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-1.5b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-14b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-32b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v2-lite/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v2.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v3-0324/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/falcon/falcon-180b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/falcon/falcon-40b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/falcon/falcon-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/finance/fingpt-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/codegemma-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-1.1-2b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-27b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-2b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-9b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-12b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-27b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-2b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-4b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/paligemma-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/recurrentgemma-2b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/gradient/llama-3-70b-1m/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/h2o/h2o-danube3-500m/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm-135m/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm-360m/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm2-1.7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/zephyr-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internlm2.5-20b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internlm2.5-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internlm3-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internvl2-26b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/intfloat/e5-mistral-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/intfloat/multilingual-e5-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/japanese/elyza-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/japanese/japanese-stablelm-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/jina/jina-embeddings-v3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/kaist/prometheus-2-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/korean/kullm-12.8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/legal/saullm-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/lmsys/vicuna-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/lmsys/vicuna-33b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/lmsys/vicuna-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/medical/biomistral-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/medical/meditron-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/codellama-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/codellama-34b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/codellama-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-2-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-2-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-2-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.1-405b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.1-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.1-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-11b-vision/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-90b-vision/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-90b-vision-instruct/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.3-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.3-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-4-maverick-400b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-4-scout-17b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-guard-3-1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-guard-3-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/seamless-m4t-v2-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/florence-2-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/orca-2-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-1/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-1.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-medium-14b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-mini-3.8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-small-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3.5-moe/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3.5-vision/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-mini/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/wizardmath-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-text-01/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/codestral-22b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/codestral-mamba-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/ministral-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-large-2411/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-medium-3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-nemo-12b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-small-24b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-small-3.1-24b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mixtral-8x22b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mixtral-8x7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mixtral-8x7b-instruct/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/pixtral-12b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/moonshot/kimi-k2.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mosaicml/mpt-30b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mosaicml/mpt-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nomic/nomic-embed-text-v1.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nousresearch/hermes-3-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nousresearch/hermes-3-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/canary-1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/helpsteer2-llama-3.1-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-51b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-70b-instruct/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-70b-reward/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/megatron-turing-530b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/minitron-4b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/minitron-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-15b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-340b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-70b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-mini-4b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-embed-v2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-embedqa-e5-v5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-embedqa-mistral-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-retriever-v1/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/parakeet-ctc-0.6b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/parakeet-tdt-1.1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/vila-1.5-13b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/vila-1.5-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/vila-1.5-40b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/dall-e-3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-base/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-large-v3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-medium/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-small/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-3-opus/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-3-sonnet/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-haiku-3.5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-opus-4/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-sonnet-4/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/command-a/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-1.5-flash/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-1.5-pro/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-2.0-flash/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-2.0-pro/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-3.5-turbo/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4-turbo/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4.5-preview/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4o/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4o-mini/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/grok-3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/inflection-3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/jamba-instruct/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/llama-4-behemoth/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/o1/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/o1-mini/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/o3-mini/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/reka-core/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2-vl-2b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-0.5b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-1.5b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-72b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-1.5b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-14b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-math-72b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-math-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-vl-72b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-vl-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-0.6b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-1.7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-235b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-30b-a3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-32b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-4b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-8b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/replit/replit-code-v1.5-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rinna/nekomata-14b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rwkv/rwkv-6-14b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sail/infoxlm-large/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/salesforce/codegen2-16b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sberbank/gigachat-20b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/scientific/sciglm-6b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sensetime/internlm-20b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sentence-transformers/all-minilm-l6-v2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/snowflake/arctic-128x3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/snowflake/arctic-480b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/sdxl-1.0/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/stablelm-2-12b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/stablelm-zephyr-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/teknium/openhermes-2.5-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/thudm/chatglm3-6b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/thudm/cogvlm2-19b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-11b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-10b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-3b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-mamba-7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tinyllama/tinyllama-1.1b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tinyllama/tinyllama-1.1b-chat/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/together/llama-3.1-70b-turbo/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/upstage/solar-10.7b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/upstage/solar-pro-22b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/wizardlm/wizardcoder-33b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/yandex/yalm-100b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/yilai/yi-6b-200k/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/chatglm4-9b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/glm-4-9b/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/glm-5/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>

  <!-- GPU pages (60 GPUs) -->
  <url><loc>https://inferencebench.io/gpus/amd-mi100/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi210/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi250x/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi300x/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi325x/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-rx-7900-xtx/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-w7900/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/aws-trainium2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v4/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v5e/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v6e/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/groq-lpu/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-3/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-3-hl325l/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-40gb-pcie/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-40gb-sxm/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-80gb-pcie/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-80gb-sxm/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a10g/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a16/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a2/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a30/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a40/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a4000/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a6000/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b100-sxm/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b200-nvl/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b200-sxm/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b300/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gb200-nvl72/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gb300-nvl72/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gh200/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-nvl/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-nvl-94gb/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-pcie/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-sxm/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h20/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h200-sxm/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l20/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l4/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l40/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l40s/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3060/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3070/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3080/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3090/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4060/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4060-ti-16gb/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4070-super/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4070-ti/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4080/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4090/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-5090/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-6000-ada/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-a5000/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-t4/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-v100-16gb/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-v100-32gb/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/qualcomm-cloud-ai-100/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>

  <!-- Provider pages (19 providers) -->
  <url><loc>https://inferencebench.io/providers/aws/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/azure/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/coreweave/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepinfra/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepseek/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fireworks/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fluidstack/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gcp/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/groq/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/huggingface/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/hyperbolic/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/lambda/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/novita/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/replicate/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/runpod/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/sambanova/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/tensordock/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/together-ai/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/vast-ai/</loc><lastmod>2026-04-01</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
</urlset>
