<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap for https://smasoudrezvani.github.io/ (sitemaps.org 0.9 protocol).
  Each <url> carries a required <loc> and, where known, a <lastmod> timestamp.
  Entry order is unchanged from the original single-line form; only whitespace
  between elements and these comments were added.
-->
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd"
        xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">

  <!-- Entries under /blog/2026/ that carry a lastmod -->
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/muon-optimizer/</loc>
    <lastmod>2026-03-30T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Causal-Inference-and-Impact-Evaluation/</loc>
    <lastmod>2026-03-31T12:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/RL-intro/</loc>
    <lastmod>2026-04-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Armed-Bandit/</loc>
    <lastmod>2026-04-02T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Tabular-methods/</loc>
    <lastmod>2026-04-03T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/RL-stability-tests/</loc>
    <lastmod>2026-04-06T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Sarsa-vs.-qlearning/</loc>
    <lastmod>2026-04-06T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Function-approximation/</loc>
    <lastmod>2026-04-07T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/PPO,-GRPO,-and-DPO/</loc>
    <lastmod>2026-04-08T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Policy-Gradient/</loc>
    <lastmod>2026-04-08T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Game-theory-intro/</loc>
    <lastmod>2026-04-20T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Bayesian-Games/</loc>
    <lastmod>2026-04-21T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Extensive-Games/</loc>
    <lastmod>2026-04-21T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Mixed-Strategies/</loc>
    <lastmod>2026-04-21T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/Nash-Equilibrium/</loc>
    <lastmod>2026-04-21T00:00:00+00:00</lastmod>
  </url>

  <!-- Entries under /projects/ that carry a lastmod -->
  <url>
    <loc>https://smasoudrezvani.github.io/projects/1_docvqa/</loc>
    <lastmod>2026-04-22T18:02:52+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/projects/2_semart/</loc>
    <lastmod>2026-04-22T18:02:52+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/projects/3_ml_dashboard/</loc>
    <lastmod>2026-04-22T18:02:52+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/projects/4_llm_fraud/</loc>
    <lastmod>2026-04-22T18:02:52+00:00</lastmod>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/projects/5_s3_minio/</loc>
    <lastmod>2026-04-22T18:02:52+00:00</lastmod>
  </url>

  <!-- Site root and top-level sections (no lastmod recorded) -->
  <url>
    <loc>https://smasoudrezvani.github.io/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/cv/</loc>
  </url>
  <!-- NOTE(review): the "_pages/dropdown" path looks like an internal
       navigation/template page rather than content meant for indexing;
       confirm whether it should be excluded at the generator level. -->
  <url>
    <loc>https://smasoudrezvani.github.io/_pages/dropdown/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/news/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/notes/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/people/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/projects/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/publications/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/repositories/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/notes/game-theory/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/notes/ml-papers/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/notes/reinforcement-learning/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/teaching/</loc>
  </url>

  <!-- Blog year archive -->
  <url>
    <loc>https://smasoudrezvani.github.io/blog/2026/</loc>
  </url>

  <!-- Blog tag pages -->
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/optimization/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/machine-learning/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/muon/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/adamw/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/llm/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/data-science/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/causal-inference/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/impact-evaluation/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/reinforcement-learning/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/ai/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/dpo/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/multi-armed-bandit/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/mdp/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/sarsa/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/q-learning/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/mlops/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/deep-learning/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/deep-rl/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/ppo/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/grpo/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/policy-gradients/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/actor-critic/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/game-theory/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/economics/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/mathematics/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/nash-equilibrium/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/bayesian-games/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/incomplete-information/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/auctions/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/extensive-form/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/backward-induction/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/subgame-perfect/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/mixed-strategies/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/tag/prisoner-dilemma/</loc>
  </url>

  <!-- Blog category pages -->
  <url>
    <loc>https://smasoudrezvani.github.io/blog/category/ml-papers/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/category/reinforcement-learning/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/category/ai-research/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/category/game-theory/</loc>
  </url>

  <!-- Books archive, tag and category pages -->
  <url>
    <loc>https://smasoudrezvani.github.io/books/2024/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/tag/top-100/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/category/classics/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/category/crime/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/category/historical-fiction/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/category/mystery/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/category/novels/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/books/category/thriller/</loc>
  </url>

  <!-- Blog index and its numbered pages -->
  <url>
    <loc>https://smasoudrezvani.github.io/blog/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/page/2/</loc>
  </url>
  <url>
    <loc>https://smasoudrezvani.github.io/blog/page/3/</loc>
  </url>

  <!-- NOTE(review): this filename looks like a search-console ownership
       verification file; such files are usually not listed in a sitemap.
       Confirm whether it should be excluded at the generator level. -->
  <url>
    <loc>https://smasoudrezvani.github.io/google2deddea92ec8de21.html</loc>
    <lastmod>2026-04-22T18:02:00+00:00</lastmod>
  </url>

</urlset>