<?xml version="1.0"?>
<dblpperson name="Anand Kannappan" pid="360/9782" n="10">
<person key="homepages/360/9782" mdate="2023-11-21">
<author pid="360/9782">Anand Kannappan</author>
</person>
<r><article publtype="informal" key="journals/corr/abs-2601-20103" mdate="2026-02-26">
<author pid="299/1910">Darshan Deshpande</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<title>Benchmarking Reward Hack Detection in Code Environments via Contrastive Analysis.</title>
<year>2026</year>
<month>January</month>
<volume>abs/2601.20103</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2601.20103</ee>
<url>db/journals/corr/corr2601.html#abs-2601-20103</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2602-00352" mdate="2026-03-11">
<author pid="391/2667">Li Siyan</author>
<author pid="299/1910">Darshan Deshpande</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<title>DETOUR: An Interactive Benchmark for Dual-Agent Search and Reasoning.</title>
<year>2026</year>
<month>February</month>
<volume>abs/2602.00352</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2602.00352</ee>
<url>db/journals/corr/corr2602.html#abs-2602-00352</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><inproceedings key="conf/acl/CH-WangDMKQ25" mdate="2025-07-24">
<author pid="301/9138">Sky CH-Wang</author>
<author pid="299/1910">Darshan Girish Deshpande</author>
<author pid="44/70">Smaranda Muresan</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<title>Browsing Lost Unformed Recollections: A Benchmark for Tip-of-the-Tongue Search and Reasoning.</title>
<pages>8317-8331</pages>
<year>2025</year>
<booktitle>ACL (1)</booktitle>
<ee type="oa">https://aclanthology.org/2025.acl-long.406/</ee>
<crossref>conf/acl/2025-1</crossref>
<url>db/conf/acl/acl2025-1.html#CH-WangDMKQ25</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-2503-19193" mdate="2025-04-19">
<author pid="301/9138">Sky CH-Wang</author>
<author pid="299/1910">Darshan Deshpande</author>
<author pid="44/70">Smaranda Muresan</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<title>Browsing Lost Unformed Recollections: A Benchmark for Tip-of-the-Tongue Search and Reasoning.</title>
<year>2025</year>
<month>March</month>
<volume>abs/2503.19193</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2503.19193</ee>
<url>db/journals/corr/corr2503.html#abs-2503-19193</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2505-08638" mdate="2025-06-23">
<author pid="299/1910">Darshan Deshpande</author>
<author pid="178/8576">Varun Gangal</author>
<author pid="408/0805">Hersh Mehta</author>
<author pid="239/6720">Jitin Krishnan</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<title>TRAIL: Trace Reasoning and Agentic Issue Localization.</title>
<year>2025</year>
<month>May</month>
<volume>abs/2505.08638</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2505.08638</ee>
<url>db/journals/corr/corr2505.html#abs-2505-08638</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2510-01353" mdate="2025-11-08">
<author pid="299/1910">Darshan Deshpande</author>
<author pid="178/8576">Varun Gangal</author>
<author pid="408/0805">Hersh Mehta</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<author pid="95/4442">Peng Wang</author>
<title>MEMTRACK: Evaluating Long-Term Memory and State Tracking in Multi-Platform Dynamic Agent Environments.</title>
<year>2025</year>
<month>October</month>
<volume>abs/2510.01353</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2510.01353</ee>
<url>db/journals/corr/corr2510.html#abs-2510-01353</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2407-08488" mdate="2024-08-16">
<author pid="267/5023">Selvan Sunitha Ravi</author>
<author pid="05/1465">Bartosz Mielczarek</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="136/9140">Douwe Kiela</author>
<author pid="254/0997">Rebecca Qian</author>
<title>Lynx: An Open Source Hallucination Evaluation Model.</title>
<year>2024</year>
<volume>abs/2407.08488</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2407.08488</ee>
<url>db/journals/corr/corr2407.html#abs-2407-08488</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2412-14140" mdate="2025-01-23">
<author pid="299/1910">Darshan Deshpande</author>
<author pid="267/5023">Selvan Sunitha Ravi</author>
<author pid="301/9138">Sky CH-Wang</author>
<author pid="05/1465">Bartosz Mielczarek</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="254/0997">Rebecca Qian</author>
<title>GLIDER: Grading LLM Interactions and Decisions using Explainable Ranking.</title>
<year>2024</year>
<volume>abs/2412.14140</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2412.14140</ee>
<url>db/journals/corr/corr2412.html#abs-2412-14140</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2311-08370" mdate="2023-11-21">
<author pid="175/1517">Bertie Vidgen</author>
<author pid="284/9434">Hannah Rose Kirk</author>
<author pid="254/0997">Rebecca Qian</author>
<author pid="295/0198">Nino Scherrer</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="32/10840">Scott A. Hale</author>
<author pid="282/4243">Paul R&#246;ttger</author>
<title>SimpleSafetyTests: a Test Suite for Identifying Critical Safety Risks in Large Language Models.</title>
<year>2023</year>
<volume>abs/2311.08370</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2311.08370</ee>
<url>db/journals/corr/corr2311.html#abs-2311-08370</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2311-11944" mdate="2023-11-23">
<author pid="324/8464">Pranab Islam</author>
<author pid="360/9782">Anand Kannappan</author>
<author pid="136/9140">Douwe Kiela</author>
<author pid="254/0997">Rebecca Qian</author>
<author pid="295/0198">Nino Scherrer</author>
<author pid="175/1517">Bertie Vidgen</author>
<title>FinanceBench: A New Benchmark for Financial Question Answering.</title>
<year>2023</year>
<volume>abs/2311.11944</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2311.11944</ee>
<url>db/journals/corr/corr2311.html#abs-2311-11944</url>
</article>
</r>
<coauthors n="18" nc="1">
<co c="0"><na f="c/CH=Wang:Sky" pid="301/9138">Sky CH-Wang</na></co>
<co c="0" n="2"><na f="d/Deshpande:Darshan" pid="299/1910">Darshan Deshpande</na><na>Darshan Girish Deshpande</na></co>
<co c="0"><na f="g/Gangal:Varun" pid="178/8576">Varun Gangal</na></co>
<co c="0"><na f="h/Hale:Scott_A=" pid="32/10840">Scott A. Hale</na></co>
<co c="0"><na f="i/Islam:Pranab" pid="324/8464">Pranab Islam</na></co>
<co c="0"><na f="k/Kiela:Douwe" pid="136/9140">Douwe Kiela</na></co>
<co c="0" n="2"><na f="k/Kirk:Hannah" pid="284/9434">Hannah Kirk</na><na>Hannah Rose Kirk</na></co>
<co c="0"><na f="k/Krishnan:Jitin" pid="239/6720">Jitin Krishnan</na></co>
<co c="0"><na f="m/Mehta:Hersh" pid="408/0805">Hersh Mehta</na></co>
<co c="0"><na f="m/Mielczarek:Bartosz" pid="05/1465">Bartosz Mielczarek</na></co>
<co c="0"><na f="m/Muresan:Smaranda" pid="44/70">Smaranda Muresan</na></co>
<co c="0"><na f="q/Qian:Rebecca" pid="254/0997">Rebecca Qian</na></co>
<co c="0"><na f="r/Ravi:Selvan_Sunitha" pid="267/5023">Selvan Sunitha Ravi</na></co>
<co c="0"><na f="r/R=ouml=ttger:Paul" pid="282/4243">Paul R&#246;ttger</na></co>
<co c="0"><na f="s/Scherrer:Nino" pid="295/0198">Nino Scherrer</na></co>
<co c="0"><na f="s/Siyan:Li" pid="391/2667">Li Siyan</na></co>
<co c="0"><na f="v/Vidgen:Bertie" pid="175/1517">Bertie Vidgen</na></co>
<co c="0"><na f="w/Wang:Peng" pid="95/4442">Peng Wang</na></co>
</coauthors>
</dblpperson>

