<?xml version="1.0" encoding="utf-8" standalone="yes" ?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata for the feed published at /tag/rlhf/. -->
    <title>RLHF | Yang Cai</title>
    <link>http://www.cs.yale.edu/homes/cai/tag/rlhf/</link>
    <!-- rel="self": the address of this feed document itself. -->
    <atom:link href="http://www.cs.yale.edu/homes/cai/tag/rlhf/index.xml"
               rel="self"
               type="application/rss+xml"/>
    <description>RLHF</description>
    <generator>Wowchemy (https://wowchemy.com)</generator>
    <language>en-us</language>
    <lastBuildDate>Sun, 04 Jan 2026 18:39:04 -0400</lastBuildDate>
    <!--
      Channel image. The RSS 2.0 specification notes that the image <title>
      and <link> should carry the same values as the channel's own <title>
      and <link>; the title is used as alternate text when the image is
      rendered.
    -->
    <image>
      <url>http://www.cs.yale.edu/homes/cai/media/icon_hu2863fb787e1951439c40d39e27eaa50a_1119_512x512_fill_lanczos_center_3.png</url>
      <title>RLHF | Yang Cai</title>
      <link>http://www.cs.yale.edu/homes/cai/tag/rlhf/</link>
    </image>
    
    <!-- Feed entry pointing at the cai-comal-2026 publication page. -->
    <item>
      <title>COMAL: A Convergent Meta-Algorithm for Aligning LLMs with General Preferences</title>
      <link>http://www.cs.yale.edu/homes/cai/publication/cai-comal-2026/</link>
      <pubDate>Sun, 04 Jan 2026 18:39:04 -0400</pubDate>
      <!-- The guid repeats the entry's <link> URL. -->
      <guid>http://www.cs.yale.edu/homes/cai/publication/cai-comal-2026/</guid>
      <!-- This entry carries no summary text. -->
      <description/>
    </item>
    
  </channel>
</rss>
