<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://datta0.github.io/posts/rethink-lora-init/</loc>
<lastmod>2026-03-23T19:20:14+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/posts/transformer-showdown/</loc>
<lastmod>2025-06-14T18:32:02+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/posts/transformer-imagined/</loc>
<lastmod>2025-06-15T20:19:27+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/posts/understanding-multi-gpu-parallelism-paradigms/</loc>
<lastmod>2026-02-24T21:37:53+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/posts/exploring-the-moe/</loc>
<lastmod>2026-02-25T16:28:36+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/posts/the-lore-behind-lora/</loc>
<lastmod>2026-03-25T10:02:50+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/categories/</loc>
<lastmod>2026-03-25T10:03:18+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/tags/</loc>
<lastmod>2026-03-25T10:03:18+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/archives/</loc>
<lastmod>2026-03-25T10:03:18+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/about/</loc>
<lastmod>2026-03-25T10:03:18+05:30</lastmod>
</url>
<url>
<loc>https://datta0.github.io/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/lora/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/fine-tuning/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/llm/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/mla/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/mha/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/gqa/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/multi-latent-attention/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/ngpt/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/differential-transformer/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/kv-cache/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/activations/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/memory/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/trainig/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/nanoformer/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/attention/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/transformer/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/ffnn/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/math/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/gpu/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/parallelism/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/vllm/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/tensor-parallelism/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/pipeline-parallelism/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/data-parallelism/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/mixture-of-experts/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/training/</loc>
</url>
<url>
<loc>https://datta0.github.io/tags/finetuning/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/lora/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/fine-tuning/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/llm/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/transformer/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/architectures/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/attention/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/ffnn/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/math/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/gpu/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/parallelism/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/vllm/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/inference/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/mixture-of-experts/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/training/</loc>
</url>
<url>
<loc>https://datta0.github.io/categories/finetuning/</loc>
</url>
</urlset>
