<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml"><url>
    <loc>https://ashwinms.com/Blogs/Backprop-=-chain-of-VJP&apos;s!</loc>
    <lastmod>2025-12-12T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Blogs/Context-Tracker-Assistant</loc>
    <lastmod>2024-11-10T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Blogs/Why-your-Model-isn&apos;t-Learning</loc>
    <lastmod>2026-02-09T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Blogs/You-think-you-knew-Dropouts-</loc>
    <lastmod>2026-02-16T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/Context-Tracker</loc>
    <lastmod>2024-11-11T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/Deeply-Learning</loc>
    <lastmod>2026-02-01T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/Go-Kafka-Consumer</loc>
    <lastmod>2022-08-24T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/HNews-Radio</loc>
    <lastmod>2025-04-06T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/Kt-Doorman-Client</loc>
    <lastmod>2024-08-21T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/Paper-Tracker</loc>
    <lastmod>2026-01-04T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/SO-101-Lerobot-&apos;25</loc>
    <lastmod>2025-07-06T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Builds/Seq2Seq-Transformer-to-Decipher-Caesar</loc>
    <lastmod>2026-02-08T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/CV/Resume</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Me</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Muse/Why-should-you-bet-on-yourself</loc>
    <lastmod>2025-05-05T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/ML-Concepts/An-Overview-Of-Gradient-Descent-Optimization-Algorithms</loc>
    <lastmod>2026-03-02T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/ML-Concepts/On-Optimizers</loc>
    <lastmod>2026-03-02T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/ALiBi</loc>
    <lastmod>2026-02-14T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Attention-is-All-You-Need</loc>
    <lastmod>2026-01-26T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Batch-Norm</loc>
    <lastmod>2026-01-15T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Chinchilla</loc>
    <lastmod>2026-02-15T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Deepseek-R1</loc>
    <lastmod>2026-01-06T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/GLU-Improves-Transformers</loc>
    <lastmod>2026-02-13T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/LLaMA</loc>
    <lastmod>2026-02-16T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Language-Models-are-Unsupervised-Multitask-Learners</loc>
    <lastmod>2026-02-11T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Layer-Norm-in-Transformers</loc>
    <lastmod>2026-02-12T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Layer-Norm</loc>
    <lastmod>2026-01-19T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/RLPR</loc>
    <lastmod>2026-01-06T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/RNN-Overview</loc>
    <lastmod>2026-01-23T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/RoFormer</loc>
    <lastmod>2026-02-13T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Rubrics-As-Reward</loc>
    <lastmod>2026-01-08T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Papers/Scaling-Laws-for-Neural-Language-Model</loc>
    <lastmod>2026-02-16T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Notes/Reading-List</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Posts/Build-Idea---My-Boss</loc>
    <lastmod>2026-03-30T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Posts/Side-Quest-MathAcademy</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/1-Lineage-of-the-Transformer</loc>
    <lastmod>2026-02-18T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/2-Implementing-a-Baseline-Model</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/3-Training-GPT-2-with-bigger-data</loc>
    <lastmod>2026-02-24T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Experiment-Template</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Hyper-Param-Sweep/Experiments-with-Weight-Decay</loc>
    <lastmod>2026-03-02T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Hyper-Param-Sweep/LR-vs-Batch-Size-Empirical-Sweep</loc>
    <lastmod>2026-02-27T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Hyper-Param-Sweep/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Mem--and--GPU-Exp/Activation-Checkpointing</loc>
    <lastmod>2026-03-07T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Mem--and--GPU-Exp/Micro-batching-+-Gradient-Accumulation</loc>
    <lastmod>2026-03-10T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/Pre-vs-Post-Norms,-With--and--Without-Warmups</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/4-Experiments/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/Resources</loc>
    <lastmod>2026-02-11T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Baseline/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Phase_1/Stage-1</loc>
    <lastmod>2026-03-28T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Phase_1/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Phase_2/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/Phase_3/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/TEL/</loc>
    <lastmod>2026-02-11T00:00:00.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Wishlist/Embedable-Widget-for-Hevy</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/Wishlist/Obsidian-Canvas-AI</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url><url>
    <loc>https://ashwinms.com/</loc>
    <lastmod>2026-03-30T20:17:05.000Z</lastmod>
  </url></urlset>