<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap for dwarez.dev in the sitemaps.org 0.9 format.
  Each <url> entry carries the page address (<loc>) and a W3C datetime
  in UTC (<lastmod>).
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">

  <!-- Top-level pages; all four entries share one lastmod timestamp. -->
  <url>
    <loc>https://dwarez.dev</loc>
    <lastmod>2026-07-03T23:35:37.633Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/about</loc>
    <lastmod>2026-07-03T23:35:37.633Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/notes</loc>
    <lastmod>2026-07-03T23:35:37.633Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/it</loc>
    <lastmod>2026-07-03T23:35:37.633Z</lastmod>
  </url>

  <!-- Blog posts, listed in descending lastmod order. -->
  <url>
    <loc>https://dwarez.dev/blog/turboquant-what-3-bit-kv-caches-actually</loc>
    <lastmod>2026-03-28T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/transformer-attention-backwards</loc>
    <lastmod>2026-03-07T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/pipeline-parallelism-surgery-on-models</loc>
    <lastmod>2025-10-12T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/data-parallelism-scaling-llm-training</loc>
    <lastmod>2025-09-28T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/the-memory-anatomy-of-large-language</loc>
    <lastmod>2025-09-19T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/from-sequential-to-parallel-your</loc>
    <lastmod>2025-06-15T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/the-transformers-anatomy-a-deep-dive</loc>
    <lastmod>2025-05-29T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/move-fast-or-die-slow</loc>
    <lastmod>2025-02-02T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/the-machine-learning-surgeons-guide</loc>
    <lastmod>2024-12-23T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/the-operating-room-setup</loc>
    <lastmod>2024-12-20T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/dissecting-torchcompile-surgical</loc>
    <lastmod>2024-12-18T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/a-quick-incision-ten-minutes-to-rag</loc>
    <lastmod>2024-12-12T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/performing-kernel-surgery-profiling</loc>
    <lastmod>2024-12-10T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/a-machine-learning-surgeons-toolkit</loc>
    <lastmod>2024-12-06T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/cerebral-cortex-and-hippocampus-understanding</loc>
    <lastmod>2024-12-03T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/hello-cuda-a-surgical-dissection</loc>
    <lastmod>2024-12-01T00:00:00.000Z</lastmod>
  </url>
  <url>
    <loc>https://dwarez.dev/blog/introduction-to-sparsity-for-efficient-inference</loc>
    <lastmod>2024-01-15T00:00:00.000Z</lastmod>
  </url>

</urlset>
