<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://www.generalcompute.com/</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>1</priority>
</url>
<url>
<loc>https://www.generalcompute.com/agents</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.9</priority>
</url>
<url>
<loc>https://www.generalcompute.com/openclaw</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.9</priority>
</url>
<url>
<loc>https://www.generalcompute.com/benchmarks</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.9</priority>
</url>
<url>
<loc>https://www.generalcompute.com/infrastructure</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.8</priority>
</url>
<url>
<loc>https://www.generalcompute.com/use-cases/coding-agents</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.8</priority>
</url>
<url>
<loc>https://www.generalcompute.com/use-cases/voice-ai</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.8</priority>
</url>
<url>
<loc>https://www.generalcompute.com/roadmap</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://www.generalcompute.com/team</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://www.generalcompute.com/careers</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://www.generalcompute.com/careers/head-of-infrastructure</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/careers/software-engineer-inference</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/demo</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>daily</changefreq>
<priority>0.8</priority>
</url>
<url>
<loc>https://www.generalcompute.com/terms</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>yearly</changefreq>
<priority>0.3</priority>
</url>
<url>
<loc>https://www.generalcompute.com/privacy</loc>
<lastmod>2026-04-23T09:05:53.729Z</lastmod>
<changefreq>yearly</changefreq>
<priority>0.3</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/s3-scheduling-for-straggler-mitigation-in-llm-serving</loc>
<lastmod>2026-04-23T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/chunked-prefill-overlapping-compute-and-communication</loc>
<lastmod>2026-04-22T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/cascade-inference-using-small-models-to-route-to-big-ones</loc>
<lastmod>2026-04-21T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/lookahead-decoding-parallel-token-generation-without-draft-models</loc>
<lastmod>2026-04-20T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/disaggregated-prefill-and-decode</loc>
<lastmod>2026-04-19T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/kv-cache-compression-mla-and-beyond</loc>
<lastmod>2026-04-18T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/ring-attention-scaling-context-to-millions-of-tokens</loc>
<lastmod>2026-04-17T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/quantization-for-inference-gptq-awq-smoothquant-fp8</loc>
<lastmod>2026-03-26T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/multi-query-grouped-query-attention</loc>
<lastmod>2026-03-25T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/medusa-eagle-sequoia-next-gen-speculative-decoding</loc>
<lastmod>2026-03-24T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/sglang-and-radix-attention</loc>
<lastmod>2026-03-24T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/continuous-batching-the-orca-paper</loc>
<lastmod>2026-03-24T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/speculative-decoding-3x-speedups-without-changing-the-model</loc>
<lastmod>2026-03-23T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/paged-attention-and-vllm</loc>
<lastmod>2026-03-22T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/flash-attention-how-tri-dao-made-attention-4x-faster</loc>
<lastmod>2026-03-21T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/build-a-real-time-voice-ai-agent</loc>
<lastmod>2026-03-20T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/how-coding-agents-depend-on-inference-speed</loc>
<lastmod>2026-03-19T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://www.generalcompute.com/blog/why-inference-speed-is-the-new-moat</loc>
<lastmod>2026-03-18T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
</urlset>
