<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  Sitemap for baichenjia.cn in the sitemaps.org 0.9 format.
  One <url> entry per page; every entry declares a weekly <changefreq>.
  <lastmod> is optional in the protocol and is absent on a few entries below.
  Element names and <loc> values must never be split across lines: a line
  break inside a tag name makes the document ill-formed, and one inside
  <loc> corrupts the URL.
  NOTE(review): the original single-line layout suggests this file is produced
  by a site build; if so, apply the same formatting in the generator (confirm).
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:xhtml="http://www.w3.org/1999/xhtml">
  <url>
    <loc>http://baichenjia.cn/publication/active-sampling-for-deep-q-learning/</loc>
    <lastmod>2019-03-10T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/obtaining-accurate-estimated-action-values/</loc>
    <lastmod>2020-03-06T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/generating-attentive-goals/</loc>
    <lastmod>2020-03-08T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/variational-dynamic-for-self-supervised-exploration/</loc>
    <lastmod>2021-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/addressing-hindsight-bias/</loc>
    <lastmod>2021-03-10T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/principled-exploration/</loc>
    <lastmod>2021-03-11T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/dynamic-bottleneck/</loc>
    <lastmod>2021-03-12T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/pessimistic-bootstrapping/</loc>
    <lastmod>2022-03-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/exploration-in-deep-reinforcement-learning/</loc>
    <lastmod>2022-03-14T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/monotonic-quantile-network/</loc>
    <lastmod>2022-03-15T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/contrastive-ucb/</loc>
    <lastmod>2022-03-15T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/self-supervised-imitation/</loc>
    <lastmod>2022-03-16T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/rorl/</loc>
    <lastmod>2022-03-17T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/false-correlation-reduction/</loc>
    <lastmod>2023-03-18T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/diverse-randomized-value-functions/</loc>
    <lastmod>2023-03-18T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/becl/</loc>
    <lastmod>2023-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/pessimistic-value-iteration/</loc>
    <lastmod>2023-03-20T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/ensemble-successor-representations/</loc>
    <lastmod>2023-03-21T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/cross-domain-policy-adaptation-via-value-guided/</loc>
    <lastmod>2023-03-23T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/diffusion-model-is-an-effective-planner/</loc>
    <lastmod>2023-03-24T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/towards-robust-offline-to-online-reinforcement-learning/</loc>
    <lastmod>2023-08-25T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/ovd-explorer/</loc>
    <lastmod>2024-03-26T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/robust-quadrupedal-locomotion/</loc>
    <lastmod>2024-03-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/skill-matters/</loc>
    <lastmod>2024-03-28T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/cross-domain-policy-adaptation-by-capturing/</loc>
    <lastmod>2024-03-30T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/how-does-goal-relabeling/</loc>
    <lastmod>2024-04-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/sam-e/</loc>
    <lastmod>2024-05-10T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/contrastive-representation-for-data-filtering/</loc>
    <lastmod>2024-05-10T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/constrained-ensemble-exploration/</loc>
    <lastmod>2024-04-30T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/selfbc/</loc>
    <lastmod>2024-07-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/privileged-knowledge-distillation/</loc>
    <lastmod>2023-01-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/large-scale-actionless/</loc>
    <lastmod>2024-02-22T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/regularized-conditional-diffusion/</loc>
    <lastmod>2024-04-07T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/a-benchmark-for-off-dynamics-reinforcement-learning/</loc>
    <lastmod>2023-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/provably-efficient-information-directed/</loc>
    <lastmod>2024-04-30T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/forward-kl-regularized-preference-optimization-for-aligning-diffusion-policies/</loc>
    <lastmod>2024-09-16T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/radiology-report-generation-via-multi-objective-preference-optimization/</loc>
    <lastmod>2024-09-16T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/decentralized-transformers-with-centralized-aggregation/</loc>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/exponential-topology-enabled-scalable-communication/</loc>
    <lastmod>2024-12-16T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/discriminator-guided-embodied-planning/</loc>
    <lastmod>2024-12-16T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/online-preference-alignment-for-language-models/</loc>
    <lastmod>2024-12-16T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/on-the-value-of-myopic-behavior/</loc>
    <lastmod>2023-08-22T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/task-agnostic-pre-training-and-task-guided-fine-tuning-for-versatile-diffusion-planner/</loc>
    <lastmod>2023-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/towards-efficient-llm/</loc>
    <lastmod>2024-05-23T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/oisa-rrg/</loc>
    <lastmod>2024-05-23T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/preference-aligned-diffusion-planner-for-quadrupedal-locomotion-control/</loc>
    <lastmod>2024-10-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/embodied-survey/</loc>
    <lastmod>2023-07-31T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/vision-language-preference-learning-for-embodied-manipulation/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/distributional-off-policy-evaluation-in-reinforcement-learning/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/humanoid-whole-body-locomotion/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/information-rlhf/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/adversarial-locomotion-and-motion-imitation-for-humanoid-policy-learning/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/revisiting-multi-agent-world-modeling-from-a-diffusion-inspired-perspective/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/towards-reliable-llm-based-robots-planning/</loc>
    <lastmod>2024-05-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/humanoidgen/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/kungfubot/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/mixture-of-residual-experts-for-humanoid-lifelike-gaits-learning-on-complex-terrains/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/learn-as-individuals/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/towards-a-generalizable-bimanual-foundation-policy-via-flow-based-video-prediction/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/towards-adaptive-humanoid-control-via-multi-behavior-distillation-and-reinforced-fine-tuning/</loc>
    <lastmod>2024-09-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/cross-domain-offline-policy-adaptation-with-dynamics--and-value-aligned-data-filtering/</loc>
    <lastmod>2025-12-02T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/kungfubot2/</loc>
    <lastmod>2023-09-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/align-then-steer/</loc>
    <lastmod>2026-01-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/steering-vision-language-action-models-as-anti-exploration/</loc>
    <lastmod>2025-12-02T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/learning-soccer-skills-for-humanoid-robots---a-progressive-perception-action-framework/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/textop---real-time-interactive-text-driven-humanoid-robot-motion-generation-and-control/</loc>
    <lastmod>2026-02-12T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/husky---humanoid-skateboarding-system-via-physics-aware-whole-body-control/</loc>
    <lastmod>2026-02-03T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/pro-hoi/</loc>
    <lastmod>2026-03-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/x-loco/</loc>
    <lastmod>2026-03-04T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/beyond-short-horizon/</loc>
    <lastmod>2026-03-17T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/halo/</loc>
    <lastmod>2026-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication-type/preprint/</loc>
    <lastmod>2026-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication_types/</loc>
    <lastmod>2026-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication/</loc>
    <lastmod>2026-03-19T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/control/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/humanoid/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/perception/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/preprint/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/robotics/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tags/</loc>
    <lastmod>2026-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/dynamics/</loc>
    <lastmod>2026-02-03T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/whole-body-control/</loc>
    <lastmod>2026-02-03T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication-type/conference/</loc>
    <lastmod>2026-01-01T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication-type/journal/</loc>
    <lastmod>2025-12-02T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication-type/article-journal/</loc>
    <lastmod>2024-04-30T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/post/blog-with-jupyter/</loc>
    <lastmod>2023-11-04T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/post/</loc>
    <lastmod>2023-11-04T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/publication-type/under-review/</loc>
    <lastmod>2023-03-09T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/</loc>
    <lastmod>2022-10-24T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/contact/</loc>
    <lastmod>2022-10-24T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/people/</loc>
    <lastmod>2022-10-24T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/academic/</loc>
    <lastmod>2020-12-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/categories/</loc>
    <lastmod>2020-12-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/category/demo/</loc>
    <lastmod>2020-12-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/post/getting-started/</loc>
    <lastmod>2020-12-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/%E5%BC%80%E6%BA%90/</loc>
    <lastmod>2020-12-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/category/%E6%95%99%E7%A8%8B/</loc>
    <lastmod>2020-12-13T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/post/writing-technical-content/</loc>
    <lastmod>2019-07-12T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/slides/</loc>
    <lastmod>2019-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/slides/example/</loc>
    <lastmod>2019-02-05T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/deep-learning/</loc>
    <lastmod>2016-04-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/tag/demo/</loc>
    <lastmod>2016-04-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/project/example/</loc>
    <lastmod>2016-04-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/project/external-project/</loc>
    <lastmod>2016-04-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/project/</loc>
    <lastmod>2016-04-27T00:00:00+00:00</lastmod>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/book/</loc>
    <changefreq>weekly</changefreq>
  </url>
  <url>
    <loc>http://baichenjia.cn/book/example/</loc>
    <changefreq>weekly</changefreq>
  </url>
</urlset>