<?xml version="1.0"?>
<dblpperson name="Zhuohao Yu 0003" pid="430/9934" n="2">
<person key="homepages/430/9934" mdate="2026-04-17">
<author pid="430/9934">Zhuohao Yu 0003</author>
<note type="affiliation">Carnegie Mellon University, Pittsburgh, PA, USA</note>
</person>
<homonyms n="3">
<h f="y/Yu:Zhuohao"><name>Zhuohao Yu</name>
</h>
<h f="y/Yu_0001:Zhuohao"><person key="homepages/319/6890" mdate="2025-05-21">
<author pid="319/6890">Zhuohao Yu 0001</author>
<note type="affiliation">Peking University, Beijing, China</note>
<note label="former" type="affiliation">Renmin University of China, School of Information, China</note>
<url>https://zhuohaoyu.github.io/</url>
<url>https://scholar.google.com/citations?user=zVYE7-UAAAAJ</url>
<url>https://github.com/zhuohaoyu</url>
<url>https://orcid.org/0009-0000-8256-8588</url>
</person>
</h>
<h f="y/Yu_0002:Zhuohao"><person key="homepages/319/6890-2" mdate="2025-07-11">
<author pid="319/6890-2">Zhuohao Yu 0002</author>
<note type="affiliation">Chinese Academy of Sciences, Institute of Software, Beijing, China</note>
<url>https://scholar.google.com/citations?user=mTbIqosAAAAJ</url>
<url>https://orcid.org/0009-0006-0037-0396</url>
<url>https://www.wikidata.org/entity/Q130803334</url>
</person>
</h>
</homonyms>
<r><article publtype="informal" key="journals/corr/abs-2602-19041" mdate="2026-04-17">
<author pid="123/4950">Jiahao Zhang</author>
<author pid="365/3111">Lujing Zhang</author>
<author pid="374/9630">Keltin Grimes</author>
<author pid="430/9934">Zhuohao Yu 0003</author>
<author pid="31/11509-1">Gokul Swamy 0001</author>
<author pid="137/8350">Zhiwei Steven Wu</author>
<title>Back to Blackwell: Closing the Loop on Intransitivity in Multi-Objective Preference Fine-Tuning.</title>
<year>2026</year>
<month>February</month>
<volume>abs/2602.19041</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2602.19041</ee>
<url>db/journals/corr/corr2602.html#abs-2602-19041</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2604-04648" mdate="2026-05-08">
<author pid="430/9934">Zhuohao Yu 0003</author>
<author pid="137/8350">Zhiwei Steven Wu</author>
<author pid="258/1018">Adam Block</author>
<title>From Curiosity to Caution: Mitigating Reward Hacking for Best-of-N with Pessimism.</title>
<year>2026</year>
<month>April</month>
<volume>abs/2604.04648</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2604.04648</ee>
<url>db/journals/corr/corr2604.html#abs-2604-04648</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<coauthors n="6" nc="1">
<co c="0"><na f="b/Block:Adam" pid="258/1018">Adam Block</na></co>
<co c="0"><na f="g/Grimes:Keltin" pid="374/9630">Keltin Grimes</na></co>
<co c="0"><na f="s/Swamy_0001:Gokul" pid="31/11509-1">Gokul Swamy 0001</na></co>
<co c="0"><na f="w/Wu:Zhiwei_Steven" pid="137/8350">Zhiwei Steven Wu</na></co>
<co c="0"><na f="z/Zhang:Jiahao" pid="123/4950">Jiahao Zhang</na></co>
<co c="0"><na f="z/Zhang:Lujing" pid="365/3111">Lujing Zhang</na></co>
</coauthors>
</dblpperson>

