<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <!-- Sitemap for spotinference.com: one <url> entry per page, grouped below by site section. -->

  <!-- Home page and top-level section pages (changefreq weekly; priority 1.0 for the home page, 0.8 for the rest). -->
  <url>
    <loc>https://spotinference.com/</loc>
    <changefreq>weekly</changefreq>
    <priority>1.0</priority>
  </url>
  <url>
    <loc>https://spotinference.com/economics</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/pricing</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/learn</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/engines</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/hardware</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/reliability</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/trust</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/api</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/reference</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research</loc>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>

  <!-- Glossary entries under /glossary/ (changefreq monthly, priority 0.6). -->
  <!-- NOTE(review): both "cold-start" and "cold-start-wake-latency" are listed, and "quantisation" and
       "fp8-quantization" use different spellings; confirm each is a distinct canonical page. -->
  <url>
    <loc>https://spotinference.com/glossary/cold-start</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/continuous-batching</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/kv-cache</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/paged-attention</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/pipeline-parallelism</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/quantisation</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/structured-output</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/tensor-parallelism</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/tool-calls</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/ttft</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/fp8-quantization</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/speculative-decoding</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/mixture-of-experts</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/spot-vs-on-demand-gpu</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/openai-compatible-api</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/cold-start-wake-latency</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/context-window</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/glossary/prefill-vs-decode</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>

  <!-- Research articles under /research/ (changefreq monthly, priority 0.6). -->
  <url>
    <loc>https://spotinference.com/research/awq</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/gptq</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/lean-stack-engineering</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/orca-continuous-batching</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/paged-attention</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/speculative-decoding</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/vllm-engine</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/h100-vs-a100-measured-throughput</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/anatomy-of-a-gpu-wake</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/invoice-true-cost-per-mtok</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/migrating-from-openai</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/retries-timeouts-backoff</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/streaming-responses</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/structured-output-and-tool-calls</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/gateway-vs-self-hosting-vllm</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/spot-vs-on-demand-inference</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/kv-cache-latency-and-cost</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://spotinference.com/research/what-a-cold-start-costs</loc>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
</urlset>
