<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <!-- Auto-generated by scripts/generate-sitemap.mjs from out/ -->

  <url><loc>https://inferencebench.io/</loc><lastmod>2026-06-17</lastmod><changefreq>daily</changefreq><priority>1.0</priority></url>
  <url><loc>https://inferencebench.io/bench/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/changelog/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-audit/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-bundle/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-cache/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-ci/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-compare/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-cost/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-diff/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-doctor/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-export/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-fetch/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-history/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-leaderboard/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-list/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-matrix/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-plugin/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-profile/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-publish/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-replay/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-run/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-schema/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-summary/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-verify/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/bench-watch/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/cli/overview/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/community/code-of-conduct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/community/contributing/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/community/discussions/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/community/security/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/concepts/envelope/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/concepts/fingerprinting/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/concepts/methodology/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/concepts/pareto/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/concepts/reproducibility/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/concepts/vendor-neutrality/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/faq/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/install/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/integrations/github-actions/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/integrations/huggingface-hub/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/plugins/llm-inference/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/plugins/overview/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/quickstart/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/audit/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/ci-integration/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/concurrency-sweep/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/cross-model/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/docker/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/multi-vendor-marathon/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/multi-vendor-matrix/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/regression-check/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/reproducibility/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/sigstore-verification/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/recipes/voice-asr/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/reference/cli-reference/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/reference/envelope-schema/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/docs/tour/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/bench/leaderboard/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/blog/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/blog/benchmarking-nvidia-alpamayo-1-5-10b-h100/</loc><lastmod>2026-04-09</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/flux2-klein-4b-image-generation-benchmark/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/gemma-4-31b-h100-complete-inference-benchmark/</loc><lastmod>2026-04-09</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/gemma-4-vs-moe-dense-model-wins/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/gpu-memory-wall-forecasting-ai-demand-2028/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/minimax-m25-229b-moe-honest-benchmark/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/minimax-m25-vs-m27-doubling-moe-params/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/minimax-m27-456b-bigger-moe-paradox/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/nemotron-super-120b-vs-ultra-253b-nvidia-showdown/</loc><lastmod>2026-04-14</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/nvidia-rubin-vera-next-gpu-revolution/</loc><lastmod>2026-04-12</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/qwen3-coder-the-model-that-does-everything-right/</loc><lastmod>2026-04-14</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/blog/whisper-large-v3-turbo-597x-realtime-asr-benchmark/</loc><lastmod>2026-04-13</lastmod><changefreq>monthly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/calculator/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/calculator/training/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/community/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-34b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-1.5-9b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-coder-9b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-large-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/01-ai--yi-lightning-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-large-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/ai21--jamba-1.5-mini-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--gte-qwen2-7b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--marco-o1-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-1.5-moe-a2.7b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2-audio-7b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-14b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-32b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-3b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/alibaba--qwen-2.5-coder-32b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--molmo-72b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-13b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/allenai--olmo-2-7b-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-lite-vs-amazon--nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-01-ai--yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-01-ai--yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-01-ai--yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-01-ai--yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-01-ai--yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-ai21--jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-ai21--jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-alibaba--qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-allenai--molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-allenai--olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-allenai--olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare-models/amazon--nova-pro-vs-amazon--nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/compare/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/aws-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/aws-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/aws-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/deepinfra-vs-fireworks/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/deepinfra-vs-together-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/gcp-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/groq-vs-deepinfra/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/groq-vs-fireworks/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/groq-vs-together-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/lambda-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/runpod-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/runpod-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/runpod-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/together-ai-vs-fireworks/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compare/providers/together-ai-vs-replicate/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/compliance/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/cookies/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/01-ai/yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/01-ai/yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/01-ai/yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/01-ai/yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/01-ai/yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/ai21/jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/ai21/jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/alibaba/qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/allenai/molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/allenai/olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/allenai/olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/amazon/nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/amazon/nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/apple/openelm-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/arabic/jais-30b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/baai/bge-base-en-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/baai/bge-large-en-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/baai/bge-m3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/baai/bge-small-en-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/baichuan/baichuan2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/baichuan/baichuan2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/bigcode/octocoder-15b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/bigcode/santacoder-1.1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/bigcode/starcoder2-15b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/bigcode/starcoder2-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/bigcode/starcoder2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/black-forest-labs/flux-1-dev/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/black-forest-labs/flux-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cerebras/btlm-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cerebras/cerebras-gpt-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/codellama/codellama-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cognitivecomputations/dolphin-2.9-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/aya-23-35b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/aya-23-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/command-r-08-2024/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/command-r-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/command-r-plus/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/command-r/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/cohere/embed-english-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/databricks/dbrx-base/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/dbrx/dbrx-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-coder-33b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-coder-6.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-coder-v2-236b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-llm-67b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-math-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-moe-16b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-r1-distill-1.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-r1-distill-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-r1-distill-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-r1-distill-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-r1-distill-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-r1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-v2-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-v2.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-v3-0324/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/deepseek-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/deepseek/janus-pro-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/falcon/falcon-180b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/falcon/falcon-40b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/falcon/falcon-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/finance/fingpt-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/codegemma-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemini-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-1.1-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-2-27b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-2-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-2-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-3-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-3-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-3-27b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-3-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-3-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/gemma-4-31b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/paligemma-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/google/recurrentgemma-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/gradient/llama-3-70b-1m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/h2o/h2o-danube3-500m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/huggingface/kokoro-82m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/huggingface/smollm-135m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/huggingface/smollm-360m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/huggingface/smollm2-1.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/huggingface/zephyr-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/internlm/internlm2.5-20b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/internlm/internlm2.5-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/internlm/internlm3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/internlm/internvl2-26b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/intfloat/e5-mistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/intfloat/multilingual-e5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/japanese/elyza-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/japanese/japanese-stablelm-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/jina/jina-embeddings-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/kaist/prometheus-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/korean/kullm-12.8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/legal/saullm-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/lmsys/vicuna-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/lmsys/vicuna-33b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/lmsys/vicuna-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/medical/biomistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/medical/meditron-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/codellama-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/codellama-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/codellama-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-2-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.1-405b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.1-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.1-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.2-11b-vision/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.2-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.2-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.2-90b-vision-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.2-90b-vision/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.3-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-3.3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-4-maverick-400b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-4-scout-17b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-guard-3-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta-llama/llama-guard-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/meta/seamless-m4t-v2-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/florence-2-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/orca-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-3-medium-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-3-mini-3.8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-3-small-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-3.5-moe/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-3.5-vision/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-4-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/phi-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/microsoft/wizardmath-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/minimax/minimax-m2-7/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/minimax/minimax-text-01/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/codestral-22b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/codestral-mamba-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/ministral-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-large-2411/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-medium-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-nemo-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-small-24b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mistral-small-3.1-24b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mixtral-8x22b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mixtral-8x7b-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/mixtral-8x7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mistral/pixtral-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/moonshot/kimi-k2.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mosaicml/mpt-30b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/mosaicml/mpt-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nomic/nomic-embed-text-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nousresearch/hermes-3-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nousresearch/hermes-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/alpamayo-10b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/canary-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/cosmos-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/eagle-2-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/eagle-2-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/eagle-2.5-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/helpsteer2-llama-3.1-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/llama-3.1-nemotron-51b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/llama-3.1-nemotron-70b-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/llama-3.1-nemotron-70b-reward/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/megatron-turing-530b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/minitron-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/minitron-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nemotron-15b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nemotron-340b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nemotron-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nemotron-mini-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nemotron-super-120b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nemotron-ultra-253b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nv-embed-v2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nv-embedqa-e5-v5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nv-embedqa-mistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nv-retriever-v1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/nvlm-d-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/parakeet-ctc-0.6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/parakeet-tdt-1.1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/vila-1.5-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/vila-1.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/nvidia/vila-1.5-40b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/openai/dall-e-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/openai/whisper-base/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/openai/whisper-large-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/openai/whisper-medium/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/openai/whisper-small/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-3-opus/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-3-sonnet/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-haiku-3.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-haiku-4-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-opus-4-1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-opus-4-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-opus-4-6/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-opus-4-7/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-opus-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-sonnet-3-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-sonnet-4-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-sonnet-4-6/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/claude-sonnet-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/command-a/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gemini-1.5-flash/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gemini-1.5-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gemini-2.0-flash/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gemini-2.0-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-3.5-turbo/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-4-turbo/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-4.5-preview/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-4o-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-4o/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-5-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-5-nano/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/gpt-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/grok-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/inflection-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/jamba-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/llama-4-behemoth/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/o1-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/o3-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/proprietary/reka-core/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2-vl-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-0.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-1.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-coder-1.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-coder-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-coder-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-coder-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-math-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-math-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-vl-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-2.5-vl-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-0.6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-1.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-235b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-30b-a3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/qwen/qwen-3-coder-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/replit/replit-code-v1.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/rinna/nekomata-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/rwkv/rwkv-6-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/sail/infoxlm-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/salesforce/codegen2-16b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/sberbank/gigachat-20b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/scientific/sciglm-6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/sensetime/internlm-20b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/sentence-transformers/all-minilm-l6-v2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/sesame/csm-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/snowflake/arctic-128x3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/snowflake/arctic-480b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/stabilityai/sdxl-1.0/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/stabilityai/stablelm-2-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/stabilityai/stablelm-zephyr-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/teknium/openhermes-2.5-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/thudm/chatglm3-6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/thudm/cogvlm2-19b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tiiuae/falcon-11b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tiiuae/falcon-3-10b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tiiuae/falcon-3-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tiiuae/falcon-3-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tiiuae/falcon-3-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tiiuae/falcon-mamba-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tinyllama/tinyllama-1.1b-chat/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/tinyllama/tinyllama-1.1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/together/llama-3.1-70b-turbo/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/upstage/solar-10.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/upstage/solar-pro-22b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/vikhyat/moondream-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/wizardlm/wizardcoder-33b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/xai/grok-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/xai/grok-3-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/xai/grok-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/xai/grok-4-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/xai/grok-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/yandex/yalm-100b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/yilai/yi-6b-200k/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/zhipu/chatglm4-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/zhipu/glm-4-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/cost-to-run/zhipu/glm-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/data-license/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/developers/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/glossary/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi100/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi210/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi250x/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi300x/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-mi325x/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-rx-7900-xtx/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/amd-w7900/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/aws-trainium2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-amd-mi300x/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-a100-40gb-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-a100-80gb-pcie/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a100-80gb-sxm-vs-nvidia-l40s/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-a6000-vs-nvidia-l40s/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-b200-sxm-vs-nvidia-b100-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-b200-sxm-vs-nvidia-h200-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-nvl-vs-nvidia-h100-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-amd-mi300x/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-a100-80gb-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-b200-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-h100-pcie/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h100-sxm-vs-nvidia-l40s/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h200-sxm-vs-nvidia-a100-80gb-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-h200-sxm-vs-nvidia-h100-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-l4-vs-nvidia-t4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-l40s-vs-nvidia-l40/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-3090-vs-nvidia-rtx-4090/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-4090-vs-nvidia-l40s/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/compare/nvidia-rtx-4090-vs-nvidia-rtx-5090/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v5e/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/google-tpu-v6e/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/groq-lpu/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-3-hl325l/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/intel-gaudi-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-40gb-pcie/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-40gb-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-80gb-pcie/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a100-80gb-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a10g/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a16/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a30/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a40/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a4000/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-a6000/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b100-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b200-nvl/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b200-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-b300/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gb200-nvl72/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gb300-nvl72/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-gh200/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-nvl-94gb/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-nvl/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-pcie/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h100-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h20/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-h200-sxm/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l20/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l40/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-l40s/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3060/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3070/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3080/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-3090/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4060-ti-16gb/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4060/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4070-super/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4070-ti/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4080/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-4090/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-5090/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-6000-ada/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-rtx-a5000/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-t4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-v100-16gb/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/nvidia-v100-32gb/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/gpus/qualcomm-cloud-ai-100/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/data-centers/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/ixps/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/leaderboard/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/infrastructure/sustainability/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/leaderboard/</loc><lastmod>2026-06-17</lastmod><changefreq>daily</changefreq><priority>1.0</priority></url>
  <url><loc>https://inferencebench.io/leaderboard/training/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/licenses/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/methodology/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/methodology/inference-score/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/models/</loc><lastmod>2026-06-17</lastmod><changefreq>daily</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-1.5-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-1.5-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-coder-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/01-ai/yi-lightning/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ai21/jamba-1.5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/ai21/jamba-1.5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/gte-qwen2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/marco-o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-1.5-moe-a2.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2-audio-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/alibaba/qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/molmo-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/olmo-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/allenai/olmo-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/amazon/nova-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/amazon/nova-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/apple/openelm-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/arabic/jais-30b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-base-en-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-large-en-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-m3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baai/bge-small-en-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baichuan/baichuan2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/baichuan/baichuan2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/octocoder-15b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/santacoder-1.1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/starcoder2-15b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/starcoder2-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/bigcode/starcoder2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/black-forest-labs/flux-1-dev/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/black-forest-labs/flux-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cerebras/btlm-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cerebras/cerebras-gpt-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/codellama/codellama-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cognitivecomputations/dolphin-2.9-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/aya-23-35b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/aya-23-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-08-2024/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r-plus/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/command-r/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/cohere/embed-english-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/databricks/dbrx-base/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/dbrx/dbrx-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-33b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-6.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-coder-v2-236b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-llm-67b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-math-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-moe-16b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-1.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1-distill-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-r1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v2-lite/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v2.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v3-0324/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/deepseek-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/deepseek/janus-pro-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/falcon/falcon-180b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/falcon/falcon-40b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/falcon/falcon-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/finance/fingpt-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/codegemma-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemini-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-1.1-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-27b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-2-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-27b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-3-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/gemma-4-31b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/paligemma-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/google/recurrentgemma-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/gradient/llama-3-70b-1m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/h2o/h2o-danube3-500m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/kokoro-82m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm-135m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm-360m/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/smollm2-1.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/huggingface/zephyr-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internlm2.5-20b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internlm2.5-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internlm3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/internlm/internvl2-26b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/intfloat/e5-mistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/intfloat/multilingual-e5-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/japanese/elyza-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/japanese/japanese-stablelm-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/jina/jina-embeddings-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/kaist/prometheus-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/korean/kullm-12.8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/legal/saullm-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/lmsys/vicuna-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/lmsys/vicuna-33b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/lmsys/vicuna-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/medical/biomistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/medical/meditron-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/codellama-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/codellama-34b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/codellama-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-2-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-2-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.1-405b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.1-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.1-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-11b-vision/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-90b-vision-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.2-90b-vision/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.3-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-3.3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-4-maverick-400b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-4-scout-17b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-guard-3-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta-llama/llama-guard-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/meta/seamless-m4t-v2-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/florence-2-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/orca-2-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-medium-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-mini-3.8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3-small-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3.5-moe/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-3.5-vision/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/phi-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/microsoft/wizardmath-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-m2-7/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/minimax/minimax-text-01/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/codestral-22b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/codestral-mamba-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/ministral-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-large-2411/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-medium-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-nemo-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-small-24b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mistral-small-3.1-24b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mixtral-8x22b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mixtral-8x7b-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/mixtral-8x7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mistral/pixtral-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/moonshot/kimi-k2.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mosaicml/mpt-30b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/mosaicml/mpt-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nomic/nomic-embed-text-v1.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nousresearch/hermes-3-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nousresearch/hermes-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/alpamayo-10b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/canary-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/cosmos-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/eagle-2-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/eagle-2-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/eagle-2.5-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/helpsteer2-llama-3.1-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-51b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-70b-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/llama-3.1-nemotron-70b-reward/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/megatron-turing-530b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/minitron-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/minitron-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-15b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-340b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-70b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-mini-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-super-120b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nemotron-ultra-253b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-embed-v2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-embedqa-e5-v5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-embedqa-mistral-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nv-retriever-v1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/nvlm-d-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/parakeet-ctc-0.6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/parakeet-tdt-1.1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/vila-1.5-13b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/vila-1.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/nvidia/vila-1.5-40b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/dall-e-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-5-5-instant/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/gpt-5-5-with-trusted-access-for-cyber/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-base/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-large-v3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-medium/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/openai/whisper-small/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-3-opus/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-3-sonnet/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-haiku-3.5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-haiku-4-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-opus-4-1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-opus-4-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-opus-4-6/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-opus-4-7/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-opus-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-sonnet-3-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-sonnet-4-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-sonnet-4-6/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/claude-sonnet-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/command-a/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-1.5-flash/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-1.5-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-2.0-flash/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gemini-2.0-pro/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-3.5-turbo/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4-turbo/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4.5-preview/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4o-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-4o/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-5-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-5-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-5-nano/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/gpt-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/grok-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/inflection-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/jamba-instruct/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/llama-4-behemoth/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/o1-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/o1/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/o3-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/proprietary/reka-core/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2-vl-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-0.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-1.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-1.5b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-coder-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-math-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-math-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-vl-72b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-2.5-vl-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-0.6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-1.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-235b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-30b-a3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-32b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-4b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/qwen/qwen-3-coder-8b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/replit/replit-code-v1.5-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rinna/nekomata-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/rwkv/rwkv-6-14b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sail/infoxlm-large/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/salesforce/codegen2-16b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sberbank/gigachat-20b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/scientific/sciglm-6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sensetime/internlm-20b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sentence-transformers/all-minilm-l6-v2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/sesame/csm-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/snowflake/arctic-128x3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/snowflake/arctic-480b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/sdxl-1.0/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/stablelm-2-12b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/stabilityai/stablelm-zephyr-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/teknium/openhermes-2.5-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/thudm/chatglm3-6b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/thudm/cogvlm2-19b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-11b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-10b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-3b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-3-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tiiuae/falcon-mamba-7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tinyllama/tinyllama-1.1b-chat/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/tinyllama/tinyllama-1.1b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/together/llama-3.1-70b-turbo/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/upstage/solar-10.7b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/upstage/solar-pro-22b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/vikhyat/moondream-2b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/wizardlm/wizardcoder-33b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-2/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-3-mini/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-4-3/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/xai/grok-4/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/yandex/yalm-100b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/yilai/yi-6b-200k/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/chatglm4-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/glm-4-9b/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/models/zhipu/glm-5/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/pricing/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/privacy/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/providers/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.8</priority></url>
  <url><loc>https://inferencebench.io/providers/aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/aws/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/azure/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/coreweave/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepinfra/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepinfra/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepseek/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/deepseek/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fireworks/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fireworks/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/fluidstack/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gcp/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/gpu-finder/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/groq/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/groq/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/huggingface/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/huggingface/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/hyperbolic/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/hyperbolic/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/lambda/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/novita/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/novita/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/replicate/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/replicate/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/runpod/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/sambanova/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/sambanova/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/tensordock/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/together-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/together-ai/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/providers/vast-ai/reviews/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/safety/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/status/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/support/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/terms/</loc><lastmod>2026-06-17</lastmod><changefreq>monthly</changefreq><priority>0.3</priority></url>
  <url><loc>https://inferencebench.io/use-case/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/chatbot/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/code-generation/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/content-generation/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/document-analysis/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/use-case/real-time-translation/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.7</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/aws-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/azure-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/coreweave-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/fluidstack-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/gcp-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/lambda-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/runpod-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/tensordock-vs-vast-ai/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-aws/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-azure/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-coreweave/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-fluidstack/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-gcp/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-lambda/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-runpod/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/vs/vast-ai-vs-tensordock/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/workload-matcher/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.9</priority></url>
  <url><loc>https://inferencebench.io/workload-matcher/history/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
  <url><loc>https://inferencebench.io/workload-matcher/pricing/</loc><lastmod>2026-06-17</lastmod><changefreq>weekly</changefreq><priority>0.5</priority></url>
</urlset>
