<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  RSS 2.0 feed for the "Multi-Agent Reinforcement Learning" tag on pair-lab.ai.
  Items are listed newest first by pubDate. Each item's guid repeats its link,
  and every item carries an empty description element.
  Title text is kept on a single line: whitespace inside a title is data and
  would otherwise be delivered to feed readers as part of the title.
-->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>Multi-Agent Reinforcement Learning | PAIR Lab: PKU Alignment and Interaction Research Lab</title>
    <link>https://pair-lab.ai/tag/multi-agent-reinforcement-learning/</link>
    <atom:link href="https://pair-lab.ai/tag/multi-agent-reinforcement-learning/index.xml" rel="self" type="application/rss+xml"/>
    <description>Multi-Agent Reinforcement Learning</description>
    <generator>Hugo Blox Builder (https://hugoblox.com)</generator>
    <language>en-us</language>
    <lastBuildDate>Thu, 03 Apr 2025 00:00:00 +0000</lastBuildDate>
    <image>
      <url>https://pair-lab.ai/media/icon_hu4f2a7092ab9dace538e8dee71ba34a1a_30036_512x512_fill_lanczos_center_3.png</url>
      <title>Multi-Agent Reinforcement Learning</title>
      <link>https://pair-lab.ai/tag/multi-agent-reinforcement-learning/</link>
    </image>
    <item>
      <title>TIMAR: Transition-Informed Representation for Sample-Efficient Multi-agent Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/nn/</link>
      <pubDate>Thu, 03 Apr 2025 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/nn/</guid>
      <description/>
    </item>
    <item>
      <title>Safe Multi-agent Reinforcement Learning for Multi-robot Control</title>
      <link>https://pair-lab.ai/publication/aij/</link>
      <pubDate>Thu, 01 Jun 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/aij/</guid>
      <description/>
    </item>
    <item>
      <title>A Game-Theoretic Framework for Managing Risk in Multi-Agent Systems</title>
      <link>https://pair-lab.ai/publication/icml_2023_3/</link>
      <pubDate>Mon, 24 Apr 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/icml_2023_3/</guid>
      <description/>
    </item>
    <item>
      <title>MANSA: Learning Fast and Slow in Multi-Agent Systems</title>
      <link>https://pair-lab.ai/publication/icml_2023_2/</link>
      <pubDate>Sun, 12 Feb 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/icml_2023_2/</guid>
      <description/>
    </item>
    <item>
      <title>On the Complexity of Computing Markov Perfect Equilibrium in General-Sum Stochastic Games</title>
      <link>https://pair-lab.ai/publication/nsr/</link>
      <pubDate>Sun, 01 Jan 2023 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/nsr/</guid>
      <description/>
    </item>
    <item>
      <title>A Game-Theoretic Approach to Multi-agent Trust Region Optimization</title>
      <link>https://pair-lab.ai/publication/dai/</link>
      <pubDate>Thu, 15 Dec 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/dai/</guid>
      <description/>
    </item>
    <item>
      <title>ACE: Cooperative Multi-agent Q-learning with Bidirectional Action-Dependency</title>
      <link>https://pair-lab.ai/publication/aaai_2023_2/</link>
      <pubDate>Tue, 29 Nov 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/aaai_2023_2/</guid>
      <description/>
    </item>
    <item>
      <title>Scalable Model-based Policy Optimization for Decentralized Networked Systems</title>
      <link>https://pair-lab.ai/publication/iros_2022/</link>
      <pubDate>Sun, 23 Oct 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/iros_2022/</guid>
      <description/>
    </item>
    <item>
      <title>A Unified Diversity Measure for Multiagent Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/neurips_2022_5/</link>
      <pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips_2022_5/</guid>
      <description/>
    </item>
    <item>
      <title>MATE: Benchmarking Multi-Agent Reinforcement Learning in Distributed Target Coverage Control</title>
      <link>https://pair-lab.ai/publication/neurips_2022_7/</link>
      <pubDate>Wed, 28 Sep 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips_2022_7/</guid>
      <description/>
    </item>
    <item>
      <title>Offline Pre-trained Multi-agent Decision Transformer</title>
      <link>https://pair-lab.ai/publication/mir/</link>
      <pubDate>Fri, 10 Jun 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/mir/</guid>
      <description/>
    </item>
    <item>
      <title>Multi-Agent Reinforcement Learning is a Sequence Modeling Problem</title>
      <link>https://pair-lab.ai/publication/neurips_2022_4/</link>
      <pubDate>Mon, 30 May 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips_2022_4/</guid>
      <description/>
    </item>
    <item>
      <title>Neural Auto-Curricula in Two-Player Zero-Sum Games</title>
      <link>https://pair-lab.ai/publication/neurips2021_1/</link>
      <pubDate>Mon, 06 Dec 2021 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips2021_1/</guid>
      <description/>
    </item>
    <item>
      <title>LIGS: Learnable Intrinsic-Reward Generation Selection for Multi-Agent Learning</title>
      <link>https://pair-lab.ai/publication/iclr_2022_1/</link>
      <pubDate>Sun, 05 Dec 2021 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/iclr_2022_1/</guid>
      <description/>
    </item>
    <item>
      <title>Trust Region Policy Optimisation in Multi-Agent Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/iclr_2022_2/</link>
      <pubDate>Thu, 23 Sep 2021 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/iclr_2022_2/</guid>
      <description/>
    </item>
    <item>
      <title>Settling the Variance of Multi-Agent Policy Gradients</title>
      <link>https://pair-lab.ai/publication/neurips2021_3/</link>
      <pubDate>Thu, 19 Aug 2021 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips2021_3/</guid>
      <description/>
    </item>
    <item>
      <title>Towards Unifying Behavioral and Response Diversity for Open-ended Learning in Zero-sum Games</title>
      <link>https://pair-lab.ai/publication/neurips2021_2/</link>
      <pubDate>Wed, 09 Jun 2021 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/neurips2021_2/</guid>
      <description/>
    </item>
  </channel>
</rss>