<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap (sitemaps.org 0.9 protocol) for anthony0727.github.io.
  Each <url> entry carries the absolute page address in <loc> and, where
  present, its last-modified timestamp in <lastmod>. The site-root entry
  has no <lastmod>; the element is optional in the protocol.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd">
  <url>
    <loc>https://anthony0727.github.io/2025/04/09/TD/</loc>
    <lastmod>2025-04-09T18:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/09/overparameterization/</loc>
    <lastmod>2025-04-09T18:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/09/TRPO/</loc>
    <lastmod>2025-04-09T18:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/09/can-we-trust-math/</loc>
    <lastmod>2025-04-09T18:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/09/state-vs-observation/</loc>
    <lastmod>2025-04-09T18:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/10/optimality-of-q/</loc>
    <lastmod>2025-04-10T17:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/10/policy-gradient/</loc>
    <lastmod>2025-04-10T17:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/2025/04/10/my-failure-log/</loc>
    <lastmod>2025-04-10T18:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://anthony0727.github.io/</loc>
  </url>
  <url>
    <loc>https://anthony0727.github.io/assets/anthony_resume_rl.pdf</loc>
    <lastmod>2025-04-25T03:13:27+00:00</lastmod>
  </url>
</urlset>
