<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://jerryzyc.github.io/learning/2024/11/01/learning-ppo-tricks.html</loc>
<lastmod>2024-11-01T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/2024/11/02/learning-domain-randomization.html</loc>
<lastmod>2024-11-02T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/2024/11/05/skills-robot-learning-roadmap.html</loc>
<lastmod>2024-11-05T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/work/2024/11/06/work-grasping-retrospective.html</loc>
<lastmod>2024-11-06T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/paper/2026/01/12/paper-sru-nav-rl.html</loc>
<lastmod>2026-01-12T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/paper/2026/01/13/paper-diffusion-policy.html</loc>
<lastmod>2026-01-13T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/paper/2026/01/13/paper-flying-point-clouds-rl.html</loc>
<lastmod>2026-01-13T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/paper/2026/01/13/paper-wmp-locomotion.html</loc>
<lastmod>2026-01-13T00:00:00+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/math-formula-rendering/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/paper-reading-blog-generator/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/permission-operations/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/about/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/categories/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning-notes/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/notes/templates/paper-note-template.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/paper-notes/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/search/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/tags/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/notes/templates/work-project-template.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/work-projects/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/docs/writing-guide.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/cross-cutting-concepts/generalization/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/cross-cutting-concepts/information-theory/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/cross-cutting-concepts/optimization-theory/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/cross-cutting-concepts/probability-review/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/cross-cutting-concepts/research-best-practices/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/architectures/attention-mechanism/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/architectures/cnn/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/architectures/lstm-gru/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/architectures/mlp/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/architectures/rnn/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/architectures/transformer/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/dl-in-practice/debugging/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/dl-in-practice/deployment-considerations/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/dl-in-practice/overfitting/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/dl-in-practice/scaling-laws/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/foundations/activation-functions/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/foundations/backpropagation/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/foundations/loss-functions/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/foundations/perceptron/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/representation-learning/autoencoders/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/representation-learning/contrastive-learning/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/representation-learning/self-supervised/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/representation-learning/vae/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/training/generalization/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/training/initialization/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/training/normalization/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/training/optimization-tricks/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/deep-learning/training/regularization/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/classical-models/gaussian-mixture/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/classical-models/kmeans/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/classical-models/linear-regression/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/classical-models/logistic-regression/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/classical-models/svm/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/fundamentals/bias-variance/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/fundamentals/evaluation-metrics/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/fundamentals/problem-types/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/fundamentals/train-test-split/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/fundamentals/what-is-ml/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/ml-in-practice/data-leakage/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/ml-in-practice/failure-cases/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/ml-in-practice/feature-engineering/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/ml-in-practice/hyperparameter-tuning/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/optimization/convexity/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/optimization/gradient-descent/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/optimization/numerical-stability/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/optimization/regularization/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/probabilistic-ml/bayesian-inference/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/probabilistic-ml/em-algorithm/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/probabilistic-ml/graphical-models/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/machine-learning/probabilistic-ml/mle-map/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/advanced-topics/credit-assignment/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/advanced-topics/memory-recurrence/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/advanced-topics/multi-agent-rl/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/advanced-topics/off-policy/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/advanced-topics/stability-issues/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/deep-rl/actor-critic/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/deep-rl/dqn/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/deep-rl/policy-gradient/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/deep-rl/ppo/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/deep-rl/sac/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/dynamic-programming/policy-evaluation/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/dynamic-programming/policy-iteration/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/dynamic-programming/value-iteration/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/fundamentals/exploration-exploitation/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/fundamentals/mdp/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/fundamentals/policy-value/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/fundamentals/pomdp/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/fundamentals/return-discount/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/model-free-rl/monte-carlo/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/model-free-rl/q-learning/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/model-free-rl/sarsa/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/model-free-rl/td-learning/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/rl-in-practice/curriculum-learning/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/rl-in-practice/failure-analysis/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/rl-in-practice/reward-design/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/learning/reinforcement-learning/rl-in-practice/sim2real/</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/notes/raw.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/article-quality-check/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/blog-health-check/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/cross-article-consistency/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/paper-to-blog-refactor/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/personal-learning-knowledge-graph/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/skills/safe-dependency-update/SKILL.html</loc>
</url>
<url>
<loc>https://jerryzyc.github.io/assets/papers/diffusion-policy.pdf</loc>
<lastmod>2026-01-14T20:30:01+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/assets/papers/flying-point-clouds-rl.pdf</loc>
<lastmod>2026-01-14T20:30:01+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/assets/papers/sru-nav-rl.pdf</loc>
<lastmod>2026-01-14T20:30:01+08:00</lastmod>
</url>
<url>
<loc>https://jerryzyc.github.io/assets/papers/wmp-locomotion.pdf</loc>
<lastmod>2026-01-14T20:30:01+08:00</lastmod>
</url>
</urlset>
