<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  RSS 2.0 feed for the "Reinforcement Learning" tag on pair-lab.ai.
  Items appear in descending pubDate order (newest first).
  Each item's guid repeats its link URL; item descriptions are empty.
  Text-bearing elements (title, link, pubDate, guid) are kept on a single
  line on purpose: whitespace inside them is delivered to feed readers as
  part of the value, so do not wrap them.
-->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>Reinforcement Learning | PAIR Lab: PKU Alignment and Interaction Research Lab</title>
    <link>https://pair-lab.ai/tag/reinforcement-learning/</link>
    <atom:link href="https://pair-lab.ai/tag/reinforcement-learning/index.xml"
               rel="self"
               type="application/rss+xml"/>
    <description>Reinforcement Learning</description>
    <generator>Hugo Blox Builder (https://hugoblox.com)</generator>
    <language>en-us</language>
    <lastBuildDate>Thu, 03 Jul 2025 00:00:00 +0000</lastBuildDate>
    <image>
      <url>https://pair-lab.ai/media/icon_hu4f2a7092ab9dace538e8dee71ba34a1a_30036_512x512_fill_lanczos_center_3.png</url>
      <title>Reinforcement Learning</title>
      <link>https://pair-lab.ai/tag/reinforcement-learning/</link>
    </image>
    <item>
      <title>ReDMan: Reliable Dexterous Manipulation with Safe Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/ml_2025/</link>
      <pubDate>Thu, 03 Jul 2025 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/ml_2025/</guid>
      <description/>
    </item>
    <item>
      <title>Remember the Past for Better Future: Memory-Augmented Offline RL</title>
      <link>https://pair-lab.ai/publication/ieee_2024/</link>
      <pubDate>Mon, 03 Jun 2024 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/ieee_2024/</guid>
      <description/>
    </item>
    <item>
      <title>Grasp Multiple Objects with One Hand</title>
      <link>https://pair-lab.ai/publication/ral_2024/</link>
      <pubDate>Wed, 06 Mar 2024 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/ral_2024/</guid>
      <description/>
    </item>
    <item>
      <title>CivRealm: A Learning and Reasoning Odyssey in Civilization for Decision-Making Agents</title>
      <link>https://pair-lab.ai/publication/iclr24_spotlight_2/</link>
      <pubDate>Mon, 01 Jan 2024 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/iclr24_spotlight_2/</guid>
      <description/>
    </item>
    <item>
      <!-- Title kept on one line: a line break here would become part of the title text. -->
      <title>GEAR: A GPU-Centric Experience Replay System for Large Reinforcement Learning Models</title>
      <link>https://pair-lab.ai/publication/icml_2023_4/</link>
      <pubDate>Tue, 25 Apr 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/icml_2023_4/</guid>
      <description/>
    </item>
    <item>
      <title>A Deep Reinforcement Learning-driven Vine Copula Method for Correlation Structure Analysis of Mortgage</title>
      <link>https://pair-lab.ai/publication/copula/</link>
      <pubDate>Sat, 01 Apr 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/copula/</guid>
      <description/>
    </item>
    <item>
      <title>Learning to Shape Rewards using a Game of Two Partners</title>
      <link>https://pair-lab.ai/publication/aaai_2023_1/</link>
      <pubDate>Mon, 06 Feb 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/aaai_2023_1/</guid>
      <description/>
    </item>
    <item>
      <title>Quality-Similar Diversity via Population Based Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/iclr_2023/</link>
      <pubDate>Thu, 02 Feb 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/iclr_2023/</guid>
      <description/>
    </item>
    <item>
      <title>Solving Inventory Management Problems through Deep Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/jss/</link>
      <pubDate>Sat, 10 Dec 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/jss/</guid>
      <description/>
    </item>
    <item>
      <title>MSRL: Distributed Reinforcement Learning with Dataflow Fragments</title>
      <link>https://pair-lab.ai/publication/msrl/</link>
      <pubDate>Mon, 03 Oct 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/msrl/</guid>
      <description/>
    </item>
    <item>
      <title>Meta-Reward-Net: Implicitly Differentiable Reward Learning for Preference-based Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/neurips_2022_1/</link>
      <pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips_2022_1/</guid>
      <description/>
    </item>
    <item>
      <!-- Title kept on one line: a line break here would become part of the title text. -->
      <title>Towards Human-Level Bimanual Dexterous Manipulation with Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/neurips_2022_6/</link>
      <pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips_2022_6/</guid>
      <description/>
    </item>
    <item>
      <title>End-to-End Affordance Learning for Robotic Manipulation</title>
      <link>https://pair-lab.ai/publication/icra_2023_1/</link>
      <pubDate>Mon, 26 Sep 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/icra_2023_1/</guid>
      <description/>
    </item>
  </channel>
</rss>