<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap for https://sreejeetm1729.github.io/ (sitemaps.org 0.9 protocol).
  Each <url> carries a required <loc> and, where one is recorded, an optional
  <lastmod> in W3C datetime form with an explicit UTC offset.
  Every <loc> appears exactly once.
-->
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd"
        xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">

  <!-- URLs under /posts/ -->
  <url>
    <loc>https://sreejeetm1729.github.io/posts/why-vanilla-q-learning-breaks-under-corrupted-rewards/</loc>
    <lastmod>2026-04-12T23:15:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/posts/why-gradient-descent-works/</loc>
    <lastmod>2026-05-12T04:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/posts/stochastic-gradient-descent/</loc>
    <lastmod>2026-05-13T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/posts/td-without-projection/</loc>
    <lastmod>2026-05-26T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/posts/function-approximation-rl/</loc>
    <lastmod>2026-05-27T05:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/posts/neural_td/</loc>
    <lastmod>2026-06-02T00:00:00+00:00</lastmod>
  </url>

  <!-- Top-level pages -->
  <url>
    <loc>https://sreejeetm1729.github.io/Who-am-I/</loc>
    <lastmod>2026-06-04T07:03:51+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/Research/</loc>
    <lastmod>2026-06-04T07:03:51+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/Publications/</loc>
    <lastmod>2026-06-04T07:03:51+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/Recent-News/</loc>
    <lastmod>2026-06-04T07:03:51+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/RL-Blogs/</loc>
    <lastmod>2026-06-04T07:03:51+00:00</lastmod>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/Resume/</loc>
    <lastmod>2026-06-04T07:03:51+00:00</lastmod>
  </url>

  <!-- /categories/, site root and /tags/ (no lastmod recorded) -->
  <url>
    <loc>https://sreejeetm1729.github.io/categories/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/</loc>
  </url>

  <!-- URLs under /tags/, one entry per tag (no lastmod recorded) -->
  <url>
    <loc>https://sreejeetm1729.github.io/tags/reinforcement-learning/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/robust-rl/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/q-learning/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/corruption/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/theory/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/optimization/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/gradient-descent/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/machine-learning/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/stochastic-gradient-descent/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/td-learning/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/function-approximation/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/markovian-sampling/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/stochastic-approximation/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/rl/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/deep-rl/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/neural-networks/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/temporal-difference-learning/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/neural-td/</loc>
  </url>
  <url>
    <loc>https://sreejeetm1729.github.io/tags/overparameterization/</loc>
  </url>

  <!-- URL under /categories/ (no lastmod recorded) -->
  <url>
    <loc>https://sreejeetm1729.github.io/categories/rl-blogs/</loc>
  </url>

  <!-- URL under /assets/ -->
  <url>
    <loc>https://sreejeetm1729.github.io/assets/pdf/2026_Resume.pdf</loc>
    <lastmod>2026-06-04T07:03:38+00:00</lastmod>
  </url>
</urlset>
