<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<!-- Blog post pages. Each entry in this group pairs a loc with a lastmod timestamp written with an explicit +00:00 offset. -->
<!-- NOTE(review): this file looks generator-produced; confirm. If so, corrections belong in the site source, not in this file. -->
<!-- NOTE(review): the four 2024 slugs use underscores and mixed case, while the 2025 and 2026 slugs are lowercase and hyphenated. These are published URLs, so they are listed as-is. -->
<url>
<loc>https://mandliya.github.io/blog/2024/LLM_inference_1/</loc>
<lastmod>2025-12-18T06:57:03+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2024/LLM_inference_2/</loc>
<lastmod>2025-12-18T06:57:03+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2024/scaling_laws/</loc>
<lastmod>2025-12-18T06:57:03+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2024/model_architecture_optimizations/</loc>
<lastmod>2025-12-18T06:57:03+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/from-words-to-meaning-implementing-word2vec-from-scratch/</loc>
<lastmod>2025-12-18T06:57:03+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/supervised-finetuning-in-llm-training-workflow/</loc>
<lastmod>2025-12-30T07:39:38+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/visualizing-attention-see-what-an-llm-sees/</loc>
<lastmod>2025-12-30T07:39:38+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/building-gpt-2-from-scratch-mechanistic-interpretability-view/</loc>
<lastmod>2026-01-12T06:30:11+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/paper-implementation-steering-language-models-with-activation-engineering/</loc>
<lastmod>2026-01-11T06:55:48+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/introduction-to-mechanistic-interpretability-superposition-and-sparse-autoencoders/</loc>
<lastmod>2025-12-25T21:32:48+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2026/deeply-learning-1-dropout-implementation-from-scratch/</loc>
<lastmod>2026-03-11T19:15:40+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2026/deeply-learning-2-cross-entropy-loss-implementation-from-scratch/</loc>
<lastmod>2026-03-11T19:14:53+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2026/deeply-learning-3-mean-squared-error-loss-implementation-from-scratch/</loc>
<lastmod>2026-03-04T23:10:09+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2026/building-an-autograd-engine-from-scratch-with-cupy-part-1-tensor-and-backpropagation/</loc>
<lastmod>2026-03-14T07:14:09+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/blog/2026/deeplygrad-part-2-teaching-our-autograd-to-classify-mnist-digits/</loc>
<lastmod>2026-03-14T00:03:39+00:00</lastmod>
</url>
<!-- Site root followed by the per-year blog archive pages (2024, 2025, 2026). None of these entries carries a lastmod. -->
<url>
<loc>https://mandliya.github.io/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/2024/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/2025/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/2026/</loc>
</url>
<!-- Tag archive pages, one entry per tag slug under /blog/tag/. None of these entries carries a lastmod. -->
<!-- NOTE(review): presumably each slug is derived from a tag written in a post; verify. Any slug fix would then have to be made in the posts, since changing a loc here alone would advertise a URL that may not exist. -->
<!-- NOTE(review): several slugs look like variants of one topic (transformer / transformers / transformerss, llm / llms / large-language-models, nlp / natural-language-processing, moe / mixture-of-experts, gqa / group-query-attention, sae / sparse-autoencoders, attention / attention-mechanism). Confirm whether these are intentionally separate tags. -->
<url>
<loc>https://mandliya.github.io/blog/tag/llm/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/inference-optimization/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/transformer/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/attention-mechanism/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/multi-head-attention/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/k-v-caching/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/memory-calculation/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/optimization-metrics/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/optimization-techniques/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/natural-language-processing/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/nlp/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/large-language-models/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/llms/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/transformers/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/ai-accelerators/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/gpus/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/tpus/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/fpgas/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/asics/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/parallel-processing/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/data-parallelism/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/model-parallelism/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/task-parallelism/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/co-processing-mode/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/intelligent-processing-units/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/reconfigurable-dataflow-units/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/neural-processing-units/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/scaling-laws/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/emergent-capabilities/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/mixture-of-experts/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/group-query-attention/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/gqa/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/moe/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/hardware-acceleration/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/model-architecture-optimizations/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/word-embeddings/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/word2vec/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/embeddings/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/embedding-models/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/deep-learning/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/neural-networks/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/supervised-fine-tuning/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/sft/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/attention/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/mechanistic-interpretability/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/residual-streams/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/ai-safety/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/activation-engineering/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/representation-engineering/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/alignment/</loc>
</url>
<!-- NOTE(review): "controlibility" is probably a misspelling of "controllability"; confirm against the post that declares this tag. -->
<url>
<loc>https://mandliya.github.io/blog/tag/controlibility/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/repe/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/superposition/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/sparse-autoencoders/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/sae/</loc>
</url>
<!-- NOTE(review): "transformerss" (double s) is probably a typo for the "transformers" tag listed earlier in this group; confirm. -->
<url>
<loc>https://mandliya.github.io/blog/tag/transformerss/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/dropout/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/pytorch/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/regularization/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/cross-entropy/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/loss-functions/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/mean-squared-error/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/autograd/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/backpropagation/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/cupy/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/automatic-differentiation/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/from-scratch/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/tag/mnist/</loc>
</url>
<!-- Category archive pages, one entry per category slug under /blog/category/. None of these entries carries a lastmod. -->
<!-- NOTE(review): presumably each slug is derived from a category written in a post; verify. Any slug fix would then have to be made in the posts, since changing a loc here alone would advertise a URL that may not exist. -->
<!-- NOTE(review): both "large-language-model" and "large-language-models" appear in this group; confirm whether they are meant to be one category. -->
<url>
<loc>https://mandliya.github.io/blog/category/large-language-model/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/inference-optimization/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/natural-language-processing/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/ai-accelerators/</loc>
</url>
<!-- NOTE(review): "emegent-capabilities" is probably a misspelling of "emergent-capabilities"; confirm against the post that declares this category. -->
<url>
<loc>https://mandliya.github.io/blog/category/emegent-capabilities/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/nlp/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/large-language-models/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/llms/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/transformers/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/mechanistic-interpretability/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/ai-safety/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/alignment/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/representation-engineering/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/activation-engineering/</loc>
</url>
<!-- NOTE(review): this slug looks like two category names fused together ("controlibility" and "natural-language-processing"), possibly from a missing separator where the categories are declared; confirm. "controlibility" itself is probably a misspelling of "controllability". -->
<url>
<loc>https://mandliya.github.io/blog/category/controlibilitynatural-language-processing/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/superposition/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/sparse-autoencoders/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/sae/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/deeply-learning/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/neural-networks/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/category/deep-learning/</loc>
</url>
<!-- Blog index page and its second pagination page. Neither entry carries a lastmod. -->
<url>
<loc>https://mandliya.github.io/blog/</loc>
</url>
<url>
<loc>https://mandliya.github.io/blog/page/2/</loc>
</url>
<!-- Static files under /assets/ (two HTML pages and two PDFs), each with a lastmod timestamp. -->
<!-- NOTE(review): the file names (example_pdf.pdf, demo.html, relativity.html, Albert_Einstein_CV.pdf) look like placeholder or demo content rather than site content; confirm whether these files should be published and listed for crawlers. If not, handle that in the site source, not in this file. -->
<url>
<loc>https://mandliya.github.io/assets/html/relativity.html</loc>
<lastmod>2026-03-14T07:14:24+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/assets/pdf/example_pdf.pdf</loc>
<lastmod>2026-03-14T07:14:25+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/assets/plotly/demo.html</loc>
<lastmod>2026-03-14T07:14:25+00:00</lastmod>
</url>
<url>
<loc>https://mandliya.github.io/assets/rendercv/rendercv_output/Albert_Einstein_CV.pdf</loc>
<lastmod>2026-03-14T07:14:25+00:00</lastmod>
</url>
</urlset>
