<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!-- RSS 2.0 feed for the author page of Yinmin Zhang on pair-lab.ai. -->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata: title, canonical page link, and the feed's own URL (atom:link rel="self"). -->
    <title>Yinmin Zhang | PAIR Lab: PKU Alignment and Interaction Research Lab</title>
    <link>https://pair-lab.ai/author/yinmin-zhang/</link>
    <atom:link href="https://pair-lab.ai/author/yinmin-zhang/index.xml" rel="self" type="application/rss+xml"/>
    <description>Yinmin Zhang</description>
    <generator>Hugo Blox Builder (https://hugoblox.com)</generator>
    <language>en-us</language>
    <!-- Matches the pubDate of the first item below. -->
    <lastBuildDate>Tue, 03 Dec 2024 00:00:00 +0000</lastBuildDate>

    <!-- Channel image; its title and link repeat the channel description and link. -->
    <image>
      <url>https://pair-lab.ai/media/icon_hu4f2a7092ab9dace538e8dee71ba34a1a_30036_512x512_fill_lanczos_center_3.png</url>
      <title>Yinmin Zhang</title>
      <link>https://pair-lab.ai/author/yinmin-zhang/</link>
    </image>

    <!-- Publication entries, listed newest first by pubDate. Each guid equals the item's link; descriptions are empty. -->
    <item>
      <title>Adaptive Pessimism via Target Q-Value for Offline Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/nn_2024/</link>
      <pubDate>Tue, 03 Dec 2024 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/nn_2024/</guid>
      <description/>
    </item>
    <item>
      <title>A Perspective of Q-value Estimation on Offline-to-Online Reinforcement Learning</title>
      <link>https://pair-lab.ai/publication/aaai_2024_2/</link>
      <pubDate>Wed, 06 Mar 2024 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/aaai_2024_2/</guid>
      <description/>
    </item>
    <item>
      <title>ACE: Cooperative Multi-agent Q-learning with Bidirectional Action-Dependency</title>
      <link>https://pair-lab.ai/publication/aaai_2023_2/</link>
      <pubDate>Tue, 29 Nov 2022 00:00:00 +0000</pubDate>
      <guid>https://pair-lab.ai/publication/aaai_2023_2/</guid>
      <description/>
    </item>
  </channel>
</rss>