<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0">
  <channel>
    <!-- Channel metadata: RSS 2.0 feed of recent PyPI updates for the multireward-grpo project. -->
    <title>PyPI recent updates for multireward-grpo</title>
    <link>https://pypi.org/project/multireward-grpo/</link>
    <description>Recent updates to the Python Package Index for multireward-grpo</description>
    <language>en</language>
    <!-- Release entry for version 0.1.0; pubDate uses the RFC 822 date format required by RSS 2.0. -->
    <item>
      <title>0.1.0</title>
      <link>https://pypi.org/project/multireward-grpo/0.1.0/</link>
      <description>Decoupled &amp; conditioned multi-reward GRPO advantage estimators, a generalized trainer, and the Theorem-3 verification harness from the paper &#39;When and Why Decoupling and Conditioning Beat Reweighting in Multi-Reward GRPO&#39;.</description>
      <author>eagle0504@gmail.com</author>
      <pubDate>Tue, 23 Jun 2026 17:44:32 GMT</pubDate>
    </item>
  </channel>
</rss>