<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap for https://www.jiajunfan.com/ in the sitemaps.org 0.9 format.
  Each <url> carries a required <loc>; <lastmod> is present only on some entries.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd">

  <!-- Blog posts (/posts/) -->
  <url>
    <loc>https://www.jiajunfan.com/posts/2025/10/diversity-collapse-rlhf/</loc>
    <lastmod>2025-10-20T00:00:00-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/posts/2025/10/inverse-scaling-audio-llms/</loc>
    <lastmod>2025-10-27T00:00:00-07:00</lastmod>
  </url>

  <!-- Publication pages (/publication/); each lastmod matches the date prefix in its URL -->
  <url>
    <loc>https://www.jiajunfan.com/publication/2020-01-01-Critic-PI2-Master-Continuous-Planning-via-Policy-Improvement-with-Path-Integrals-and-Deep-Actor-Critic-Reinforcement-Learning</loc>
    <lastmod>2020-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2021-01-01-A-Review-for-Deep-Reinforcement-Learning-in-Atari-Benchmarks-Challenges-and-Solutions</loc>
    <lastmod>2021-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2021-01-01-An-Entropy-Regularization-Free-Mechanism-for-Policy-based-Reinforcement-Learning</loc>
    <lastmod>2021-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2021-01-01-CASA-A-Bridge-Between-Gradient-of-Policy-Improvement-and-Policy-Evaluation</loc>
    <lastmod>2021-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2021-01-01-GDI-Rethinking-What-Makes-Reinforcement-Learning-Different-From-Supervised-Learning</loc>
    <lastmod>2021-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2022-01-01-CASA-Bridging-the-Gap-between-Policy-Improvement-and-Policy-Evaluation-with-Conflict-Averse-Policy-Iteration</loc>
    <lastmod>2022-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2022-01-01-Entire-Space-Counterfactual-Learning-Tuning-Analytical-Properties-and-Industrial-Applications</loc>
    <lastmod>2022-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2022-01-01-Generalized-Data-Distribution-Iteration</loc>
    <lastmod>2022-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2023-01-01-Learnable-Behavior-Control</loc>
    <lastmod>2023-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2023-06-01-Optimal-Transport-Treatment-Effect</loc>
    <lastmod>2023-06-01T00:00:00-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2024-01-01-Efficient-Design-Control-RL</loc>
    <lastmod>2024-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2025-01-01-ORW-CFM-W2-ICLR2025</loc>
    <lastmod>2025-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2025-01-02-PRANCE-TPAMI</loc>
    <lastmod>2025-01-02T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2025-06-01-ADRPO-NeurIPS2025</loc>
    <lastmod>2025-06-01T00:00:00-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2025-06-02-VSCL-NeurIPS2025</loc>
    <lastmod>2025-06-02T00:00:00-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2025-06-03-ProteinZero</loc>
    <lastmod>2025-06-03T00:00:00-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2025-10-01-AC-Flow</loc>
    <lastmod>2025-10-01T00:00:00-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2026-01-01-CESAR-ICLR2026</loc>
    <lastmod>2026-01-01T00:00:00-08:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publication/2026-01-02-SP-VLA-ICLR2026</loc>
    <lastmod>2026-01-02T00:00:00-08:00</lastmod>
  </url>

  <!-- Site pages listed without a lastmod (home, section indexes, project pages) -->
  <url>
    <loc>https://www.jiajunfan.com/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/categories/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/contact/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/cv/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/adrpo/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/cesar/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/orw-cfm-w2/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/ac-flow/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/gdi/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/lbc/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/projects/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/publications/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/blog/reading-papers/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/tags/</loc>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/year-archive/</loc>
  </url>

  <!-- PDF files under /files/; all share one lastmod timestamp -->
  <url>
    <loc>https://www.jiajunfan.com/files/ACM.pdf</loc>
    <lastmod>2026-03-30T07:05:13-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/files/CV.pdf</loc>
    <lastmod>2026-03-30T07:05:13-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/files/Graduate_Transcript.pdf</loc>
    <lastmod>2026-03-30T07:05:13-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/files/Undergraduate_Transcript.pdf</loc>
    <lastmod>2026-03-30T07:05:13-07:00</lastmod>
  </url>

  <!--
    NOTE(review): the two google*.html entries below look like search-engine
    site-verification files rather than content pages. Confirm, and if so consider
    excluding them where the sitemap is produced instead of editing this file.
  -->
  <url>
    <loc>https://www.jiajunfan.com/google2c5588c3ec07157e.html</loc>
    <lastmod>2026-03-30T07:05:13-07:00</lastmod>
  </url>
  <url>
    <loc>https://www.jiajunfan.com/googleafbef25d80bb49e9.html</loc>
    <lastmod>2026-03-30T07:05:13-07:00</lastmod>
  </url>

</urlset>
