<?xml version="1.0" encoding="utf-8" standalone="yes"?><rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom"><channel><title>1 | PAIR Lab: PKU Alignment and Interaction Research Lab</title><link>https://pair-lab.ai/publication-type/1/</link><atom:link href="https://pair-lab.ai/publication-type/1/index.xml" rel="self" type="application/rss+xml"/><description>1</description><generator>Hugo Blox Builder (https://hugoblox.com)</generator><language>en-us</language><lastBuildDate>Thu, 03 Jul 2025 00:00:00 +0000</lastBuildDate><image><url>https://pair-lab.ai/media/icon_hu4f2a7092ab9dace538e8dee71ba34a1a_30036_512x512_fill_lanczos_center_3.png</url><title>1</title><link>https://pair-lab.ai/publication-type/1/</link></image><item><title>Benchmarking Multi-national Value Alignment for Large Language Models</title><link>https://pair-lab.ai/publication/acl_2025_2/</link><pubDate>Thu, 03 Jul 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/acl_2025_2/</guid><description/></item><item><title>PKU-safeRLHF: Towards Multi-level Safety Alignment for LLMs with Human Preference</title><link>https://pair-lab.ai/publication/acl_2025_3/</link><pubDate>Thu, 03 Jul 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/acl_2025_3/</guid><description/></item><item><title>Differentiable Information Enhanced Model-Based Reinforcement Learning</title><link>https://pair-lab.ai/publication/aaai_2025/</link><pubDate>Thu, 03 Apr 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2025/</guid><description/></item><item><title>Distributed Policy Space Response Oracles in Two-Player Zero-Sum Games</title><link>https://pair-lab.ai/publication/ieee_2025/</link><pubDate>Thu, 03 Apr 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/ieee_2025/</guid><description/></item><item><title>Magnetic Preference Optimization: Achieving Last-iterate Convergence for Language Model Alignment</title><link>https://pair-lab.ai/publication/iclr_2025_2/</link><pubDate>Thu, 03 Apr 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2025_2/</guid><description/></item><item><title>Rat: Adversarial Attacks on Deep Reinforcement Agents for Targeted Behaviors</title><link>https://pair-lab.ai/publication/aaai_2025_3/</link><pubDate>Thu, 03 Apr 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2025_3/</guid><description/></item><item><title>Towards Efficient Collaboration Via Graph Modeling In Reinforcement Learning</title><link>https://pair-lab.ai/publication/aaai_2025_2/</link><pubDate>Thu, 03 Apr 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2025_2/</guid><description/></item><item><title>Differentiable Information Enhanced Model-Based Reinforcement Learning</title><link>https://pair-lab.ai/publication/aaai_2025_oral_1/</link><pubDate>Mon, 03 Mar 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2025_oral_1/</guid><description/></item><item><title>Falcon: Fast Visuomotor Policies via Partial Denoising</title><link>https://pair-lab.ai/publication/icml_2025/</link><pubDate>Mon, 03 Mar 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2025/</guid><description/></item><item><title>Sequence to Sequence Reward Modeling: Improving RLHF by Language Feedback</title><link>https://pair-lab.ai/publication/aaai_2025_oral_2/</link><pubDate>Mon, 03 Mar 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2025_oral_2/</guid><description/></item><item><title>Amulet: ReAlignment During Test Time for Personalized Preference Adaptation of LLMs</title><link>https://pair-lab.ai/publication/iclr_2025/</link><pubDate>Wed, 26 Feb 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2025/</guid><description/></item><item><title>SAE-V: Interpreting Multimodal Models for Enhanced Alignment</title><link>https://pair-lab.ai/publication/icml_2025_2/</link><pubDate>Mon, 03 Feb 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2025_2/</guid><description/></item><item><title>Stream Aligner: Efficient Sentence-Level Alignment via Distribution Induction</title><link>https://pair-lab.ai/publication/aaai_2025_alignment/</link><pubDate>Thu, 09 Jan 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2025_alignment/</guid><description/></item><item><title>Mitigating Reward Over-Optimization in RLHF via Behavior-Supported Regularization</title><link>https://pair-lab.ai/publication/iclr_2025_3/</link><pubDate>Fri, 03 Jan 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2025_3/</guid><description/></item><item><title>Safesora: Towards Safety Alignment of Text2video Generation via a Human Preference Dataset</title><link>https://pair-lab.ai/publication/nips_2025_2/</link><pubDate>Fri, 03 Jan 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_2025_2/</guid><description/></item><item><title>Scalable Constrained Policy Optimization for Safe Multi-agent Reinforcement Learning</title><link>https://pair-lab.ai/publication/nips_2025/</link><pubDate>Fri, 03 Jan 2025 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_2025/</guid><description/></item><item><title>JARVIS-1: Open-World Multi-task Agents with Memory-Augmented Multimodal Language Models</title><link>https://pair-lab.ai/publication/pami/</link><pubDate>Thu, 05 Dec 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/pami/</guid><description/></item><item><title>Aligner: Efficient Alignment by Learning to Correct</title><link>https://pair-lab.ai/publication/nips_2024_oral/</link><pubDate>Thu, 26 Sep 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_2024_oral/</guid><description/></item><item><title>Panacea: Pareto Alignment via Preference Adaptation for LLMs</title><link>https://pair-lab.ai/publication/nips_2024/</link><pubDate>Thu, 26 Sep 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_2024/</guid><description/></item><item><title>Neural Attention Field: Emerging Point Relevance in 3D Scenes for One-Shot Dexterous Grasping</title><link>https://pair-lab.ai/publication/corl_2024/</link><pubDate>Fri, 06 Sep 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/corl_2024/</guid><description/></item><item><title>Off-Agent Trust Region Policy Optimization</title><link>https://pair-lab.ai/publication/ijcai_2024/</link><pubDate>Sat, 03 Aug 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/ijcai_2024/</guid><description/></item><item><title>ProgressGym: Alignment with a Millennium of Moral Progress</title><link>https://pair-lab.ai/publication/nips_2024_db_spotlight/</link><pubDate>Sat, 03 Aug 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_2024_db_spotlight/</guid><description/></item><item><title>Efficient Adaptation in Mixed-Motive Environments via Hierarchical Opponent Modeling and Planning</title><link>https://pair-lab.ai/publication/icml_2024_2/</link><pubDate>Fri, 12 Jul 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2024_2/</guid><description/></item><item><title>In-Context Editing: Learning Knowledge from Self-Induced Distributions</title><link>https://pair-lab.ai/publication/iclr_2025_4/</link><pubDate>Mon, 03 Jun 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2025_4/</guid><description/></item><item><title>Language models resist alignment: Evidence from data compression</title><link>https://pair-lab.ai/publication/acl_2025_best_paper/</link><pubDate>Mon, 03 Jun 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/acl_2025_best_paper/</guid><description/></item><item><title>Remember the Past for Better Future: Memory-Augmented Offline RL</title><link>https://pair-lab.ai/publication/ieee_2024/</link><pubDate>Mon, 03 Jun 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/ieee_2024/</guid><description/></item><item><title>Anyskill: Learning Open-Vocabulary Physical Skill for Interactive Agents</title><link>https://pair-lab.ai/publication/cvpr_2024/</link><pubDate>Sun, 19 May 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/cvpr_2024/</guid><description/></item><item><title>End-to-End Neuro-Symbolic Reinforcement Learning with Textual Explanations</title><link>https://pair-lab.ai/publication/icml_2024_1/</link><pubDate>Thu, 02 May 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2024_1/</guid><description/></item><item><title>A Perspective of Q-value Estimation on Offline-to-Online Reinforcement Learning</title><link>https://pair-lab.ai/publication/aaai_2024_2/</link><pubDate>Wed, 06 Mar 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2024_2/</guid><description/></item><item><title>Grasp Multiple Objects with One Hand</title><link>https://pair-lab.ai/publication/ral_2024/</link><pubDate>Wed, 06 Mar 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/ral_2024/</guid><description/></item><item><title>ProAgent: Building Proactive Cooperative Agents with Large Language Models</title><link>https://pair-lab.ai/publication/aaai_2024_oral/</link><pubDate>Sun, 03 Mar 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2024_oral/</guid><description/></item><item><title>STAS: Spatial-Temporal Return Decomposition for Multi-agent Reinforcement Learning</title><link>https://pair-lab.ai/publication/aaai_2024_1/</link><pubDate>Tue, 06 Feb 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2024_1/</guid><description/></item><item><title>CivRealm: A Learning and Reasoning Odyssey in Civilization for Decision-Making Agents</title><link>https://pair-lab.ai/publication/iclr24_spotlight_2/</link><pubDate>Mon, 01 Jan 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr24_spotlight_2/</guid><description/></item><item><title>Maximum Entropy Heterogeneous-Agent Reinforcement Learning</title><link>https://pair-lab.ai/publication/iclr24_spotlight/</link><pubDate>Mon, 01 Jan 2024 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr24_spotlight/</guid><description/></item><item><title>BeaverTails: A Human-Preference Dataset for LLM Harmlessness Alignment</title><link>https://pair-lab.ai/publication/neurips23db_2/</link><pubDate>Tue, 30 May 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips23db_2/</guid><description/></item><item><title>Safety Gymnasium: A Unified Safe Reinforcement Learning Benchmark</title><link>https://pair-lab.ai/publication/neurips23db_1/</link><pubDate>Tue, 30 May 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips23db_1/</guid><description/></item><item><title>Unidexgrasp++: Improving Dexterous Grasping Policy Learning via Geometry-Aware Curriculum and Iterative Generalist-Specialist Learning</title><link>https://pair-lab.ai/publication/iccv23/</link><pubDate>Thu, 04 May 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iccv23/</guid><description/></item><item><title>GEAR: A GPU-Centric Experience Replay System for Large Reinforcement Learning Models</title><link>https://pair-lab.ai/publication/icml_2023_4/</link><pubDate>Tue, 25 Apr 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2023_4/</guid><description/></item><item><title>A Game-Theoretic Framework for Managing Risk in Multi-Agent Systems</title><link>https://pair-lab.ai/publication/icml_2023_3/</link><pubDate>Mon, 24 Apr 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2023_3/</guid><description/></item><item><title>Regret-Minimizing Double Oracle for Extensive-Form Games</title><link>https://pair-lab.ai/publication/icml_2023_1/</link><pubDate>Thu, 20 Apr 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2023_1/</guid><description/></item><item><title>MANSA: Learning Fast and Slow in Multi-Agent Systems</title><link>https://pair-lab.ai/publication/icml_2023_2/</link><pubDate>Sun, 12 Feb 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icml_2023_2/</guid><description/></item><item><title>Learning to Shape Rewards using a Game of Two Partners</title><link>https://pair-lab.ai/publication/aaai_2023_1/</link><pubDate>Mon, 06 Feb 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2023_1/</guid><description/></item><item><title>Quality-Similar Diversity via Population Based Reinforcement Learning</title><link>https://pair-lab.ai/publication/iclr_2023/</link><pubDate>Thu, 02 Feb 2023 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2023/</guid><description/></item><item><title>A Game-Theoretic Approach to Multi-agent Trust Region Optimization</title><link>https://pair-lab.ai/publication/dai/</link><pubDate>Thu, 15 Dec 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/dai/</guid><description/></item><item><title>ACE: Cooperative Multi-agent Q-learning with Bidirectional Action-Dependency</title><link>https://pair-lab.ai/publication/aaai_2023_2/</link><pubDate>Tue, 29 Nov 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/aaai_2023_2/</guid><description/></item><item><title>Contextual Transformer for Offline Meta Reinforcement Learning</title><link>https://pair-lab.ai/publication/nips_workshop_2/</link><pubDate>Tue, 15 Nov 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_workshop_2/</guid><description/></item><item><title>TorchOpt: An Efficient Library for Differentiable Optimization</title><link>https://pair-lab.ai/publication/nips_workshop_1/</link><pubDate>Sun, 13 Nov 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/nips_workshop_1/</guid><description/></item><item><title>Scalable Model-based Policy Optimization for Decentralized Networked Systems</title><link>https://pair-lab.ai/publication/iros_2022/</link><pubDate>Sun, 23 Oct 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iros_2022/</guid><description/></item><item><title>GenDexGrasp: Generalizable Dexterous Grasping</title><link>https://pair-lab.ai/publication/icra_2023_2/</link><pubDate>Mon, 03 Oct 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icra_2023_2/</guid><description/></item><item><title>A Theoretical Understanding of Gradient Bias in Meta-Reinforcement Learning</title><link>https://pair-lab.ai/publication/neurips_2022_2/</link><pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_2/</guid><description/></item><item><title>A Unified Diversity Measure for Multiagent Reinforcement Learning</title><link>https://pair-lab.ai/publication/neurips_2022_5/</link><pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_5/</guid><description/></item><item><title>Constrained Update Projection Approach to Safe Policy Optimization</title><link>https://pair-lab.ai/publication/neurips_2022_3/</link><pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_3/</guid><description/></item><item><title>MATE: Benchmarking Multi-Agent Reinforcement Learning in Distributed Target Coverage Control</title><link>https://pair-lab.ai/publication/neurips_2022_7/</link><pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_7/</guid><description/></item><item><title>Meta-Reward-Net: Implicitly Differentiable Reward Learning for Preference-based Reinforcement Learning</title><link>https://pair-lab.ai/publication/neurips_2022_1/</link><pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_1/</guid><description/></item><item><title>Towards Human-Level Bimanual Dexterous Manipulation with Reinforcement Learning</title><link>https://pair-lab.ai/publication/neurips_2022_6/</link><pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_6/</guid><description/></item><item><title>End-to-End Affordance Learning for Robotic Manipulation</title><link>https://pair-lab.ai/publication/icra_2023_1/</link><pubDate>Mon, 26 Sep 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/icra_2023_1/</guid><description/></item><item><title>Debias the Black-Box: A Fair Ranking Framework via Knowledge Distillation</title><link>https://pair-lab.ai/publication/wise_2022/</link><pubDate>Wed, 24 Aug 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/wise_2022/</guid><description/></item><item><title>Multi-Agent Reinforcement Learning is a Sequence Modeling Problem</title><link>https://pair-lab.ai/publication/neurips_2022_4/</link><pubDate>Mon, 30 May 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips_2022_4/</guid><description/></item><item><title>On the Convergence of Fictitious Play: A Decomposition Approach</title><link>https://pair-lab.ai/publication/ijcai_2021/</link><pubDate>Tue, 03 May 2022 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/ijcai_2021/</guid><description/></item><item><title>Neural Auto-Curricula in Two-Player Zero-Sum Games</title><link>https://pair-lab.ai/publication/neurips2021_1/</link><pubDate>Mon, 06 Dec 2021 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips2021_1/</guid><description/></item><item><title>LIGS: Learnable Intrinsic-Reward Generation Selection for Multi-Agent Learning</title><link>https://pair-lab.ai/publication/iclr_2022_1/</link><pubDate>Sun, 05 Dec 2021 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2022_1/</guid><description/></item><item><title>Trust Region Policy Optimisation in Multi-Agent Reinforcement Learning</title><link>https://pair-lab.ai/publication/iclr_2022_2/</link><pubDate>Thu, 23 Sep 2021 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/iclr_2022_2/</guid><description/></item><item><title>Settling the Variance of Multi-Agent Policy Gradients</title><link>https://pair-lab.ai/publication/neurips2021_3/</link><pubDate>Thu, 19 Aug 2021 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips2021_3/</guid><description/></item><item><title>Towards Unifying Behavioral and Response Diversity for Open-ended Learning in Zero-sum Games</title><link>https://pair-lab.ai/publication/neurips2021_2/</link><pubDate>Wed, 09 Jun 2021 00:00:00 +0000</pubDate><guid>https://pair-lab.ai/publication/neurips2021_2/</guid><description/></item></channel></rss>