<?xml version="1.0"?>
<dblpperson name="Yaniv Oren" pid="331/8510" n="11">
<person key="homepages/331/8510" mdate="2022-10-28">
<author pid="331/8510">Yaniv Oren</author>
</person>
<r><article publtype="informal" key="journals/corr/abs-2602-18857" mdate="2026-03-29">
<author pid="286/5559">Joery A. de Vries</author>
<author pid="274/6365">Jinke He</author>
<author pid="331/8510">Yaniv Oren</author>
<author pid="374/3312">Pascal R. van der Vaart</author>
<author pid="91/3015">Mathijs de Weerdt</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<title>VariBASed: Variational Bayes-Adaptive Sequential Monte-Carlo Planning for Deep Reinforcement Learning.</title>
<year>2026</year>
<month>February</month>
<volume>abs/2602.18857</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2602.18857</ee>
<url>db/journals/corr/corr2602.html#abs-2602-18857</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><inproceedings key="conf/iclr/OrenVSB25" mdate="2025-05-15">
<author pid="331/8510">Yaniv Oren</author>
<author pid="404/8762">Viliam Vadocz</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<author pid="08/9988">Wendelin Boehmer</author>
<title>Epistemic Monte Carlo Tree Search.</title>
<year>2025</year>
<booktitle>ICLR</booktitle>
<ee type="oa">https://openreview.net/forum?id=Tb8RiXOc3N</ee>
<crossref>conf/iclr/2025</crossref>
<url>db/conf/iclr/iclr2025.html#OrenVSB25</url>
</inproceedings>
</r>
<r><inproceedings key="conf/icml/VriesHOS25" mdate="2026-02-04">
<author pid="286/5559">Joery A. de Vries</author>
<author pid="274/6365">Jinke He</author>
<author pid="331/8510">Yaniv Oren</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<title>Trust-Region Twisted Policy Improvement.</title>
<year>2025</year>
<booktitle>ICML</booktitle>
<ee type="oa">https://proceedings.mlr.press/v267/de-vries25a.html</ee>
<ee type="oa">https://openreview.net/forum?id=N0jZKugEuS</ee>
<crossref>conf/icml/2025</crossref>
<url>db/conf/icml/icml2025.html#VriesHOS25</url>
</inproceedings>
</r>
<r><article publtype="informal" key="journals/corr/abs-2504-06048" mdate="2025-05-21">
<author pid="286/5559">Joery A. de Vries</author>
<author pid="274/6365">Jinke He</author>
<author pid="331/8510">Yaniv Oren</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<title>Trust-Region Twisted Policy Improvement.</title>
<year>2025</year>
<month>April</month>
<volume>abs/2504.06048</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2504.06048</ee>
<url>db/journals/corr/corr2504.html#abs-2504-06048</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2505-21119" mdate="2025-06-27">
<author pid="290/1950">Moritz A. Zanger</author>
<author pid="349/0201">Max Weltevrede</author>
<author pid="331/8510">Yaniv Oren</author>
<author pid="374/3312">Pascal R. van der Vaart</author>
<author pid="275/3502">Caroline Horsch</author>
<author pid="08/9988">Wendelin B&#246;hmer</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<title>Universal Value-Function Uncertainties.</title>
<year>2025</year>
<month>May</month>
<volume>abs/2505.21119</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2505.21119</ee>
<url>db/journals/corr/corr2505.html#abs-2505-21119</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2506-04398" mdate="2025-07-06">
<author pid="365/5726">Th&#233;o Vincent</author>
<author pid="241/5607">Yogesh Tripathi</author>
<author pid="391/5795">Tim Lukas Faust</author>
<author pid="331/8510">Yaniv Oren</author>
<author pid="p/JanPeters1">Jan Peters 0001</author>
<author pid="182/8953">Carlo D'Eramo</author>
<title>Bridging the Performance Gap Between Target-Free and Target-Based Reinforcement Learning With Iterated Q-Learning.</title>
<year>2025</year>
<month>June</month>
<volume>abs/2506.04398</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2506.04398</ee>
<url>db/journals/corr/corr2506.html#abs-2506-04398</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2506-15756" mdate="2025-07-11">
<author pid="262/6483">Jo&#227;o G. Ribeiro</author>
<author pid="331/8510">Yaniv Oren</author>
<author pid="91/515">Alberto Sardinha</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<author pid="86/839">Francisco S. Melo</author>
<title>RecBayes: Recurrent Bayesian Ad Hoc Teamwork in Large Partially Observable Domains.</title>
<year>2025</year>
<month>June</month>
<volume>abs/2506.15756</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2506.15756</ee>
<url>db/journals/corr/corr2506.html#abs-2506-15756</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2511-14220" mdate="2026-01-14">
<author pid="331/8510">Yaniv Oren</author>
<author pid="286/5559">Joery A. de Vries</author>
<author pid="374/3312">Pascal R. van der Vaart</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<author pid="08/9988">Wendelin B&#246;hmer</author>
<title>Parallelizing Tree Search with Twice Sequential Monte Carlo.</title>
<year>2025</year>
<month>November</month>
<volume>abs/2511.14220</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2511.14220</ee>
<url>db/journals/corr/corr2511.html#abs-2511-14220</url>
<stream>streams/journals/corr</stream>
</article>
</r>
<r><article key="journals/jocn/OrenKK24" mdate="2025-05-09">
<author pid="331/8510">Yaniv Oren</author>
<author orcid="0000-0003-1895-0189" pid="121/9166">Maria Korman</author>
<author pid="128/7314">Avi Karni</author>
<title>Paradoxical Long-term Memory Augmentation following Temporal Pairing between &#34;Limited&#34; and &#34;Extensive&#34; Motor Sequence Training Experiences.</title>
<pages>2807-2821</pages>
<year>2024</year>
<volume>36</volume>
<journal>J. Cogn. Neurosci.</journal>
<number>12</number>
<ee>https://doi.org/10.1162/jocn_a_02186</ee>
<url>db/journals/jocn/jocn36.html#OrenKK24</url>
<stream>streams/journals/jocn</stream>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2406-01423" mdate="2025-05-31">
<author pid="331/8510">Yaniv Oren</author>
<author orcid="0000-0002-3827-1143" pid="290/1950">Moritz A. Zanger</author>
<author pid="374/3312">Pascal R. van der Vaart</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<author orcid="0000-0002-4398-6792" pid="08/9988">Wendelin B&#246;hmer</author>
<title>Value Improved Actor Critic Algorithms.</title>
<year>2024</year>
<volume>abs/2406.01423</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2406.01423</ee>
<url>db/journals/corr/corr2406.html#abs-2406-01423</url>
</article>
</r>
<r><article publtype="informal" key="journals/corr/abs-2210-13455" mdate="2023-09-30">
<author pid="331/8510">Yaniv Oren</author>
<author pid="27/6431">Matthijs T. J. Spaan</author>
<author orcid="0000-0002-4398-6792" pid="08/9988">Wendelin B&#246;hmer</author>
<title>Planning with Uncertainty: Deep Exploration in Model-Based Reinforcement Learning.</title>
<year>2022</year>
<volume>abs/2210.13455</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2210.13455</ee>
<url>db/journals/corr/corr2210.html#abs-2210-13455</url>
</article>
</r>
<coauthors n="20" nc="3">
<co c="0" n="2"><na f="b/B=ouml=hmer:Wendelin" pid="08/9988">Wendelin B&#246;hmer</na><na>Wendelin Boehmer</na></co>
<co c="1"><na f="d/D=Eramo:Carlo" pid="182/8953">Carlo D'Eramo</na></co>
<co c="1"><na f="f/Faust:Tim_Lukas" pid="391/5795">Tim Lukas Faust</na></co>
<co c="0"><na f="h/He:Jinke" pid="274/6365">Jinke He</na></co>
<co c="0"><na f="h/Horsch:Caroline" pid="275/3502">Caroline Horsch</na></co>
<co c="2"><na f="k/Karni:Avi" pid="128/7314">Avi Karni</na></co>
<co c="2"><na f="k/Korman:Maria" pid="121/9166">Maria Korman</na></co>
<co c="0"><na f="m/Melo:Francisco_S=" pid="86/839">Francisco S. Melo</na></co>
<co c="1"><na f="p/Peters_0001:Jan" pid="p/JanPeters1">Jan Peters 0001</na></co>
<co c="0"><na f="r/Ribeiro:Jo=atilde=o_G=" pid="262/6483">Jo&#227;o G. Ribeiro</na></co>
<co c="0"><na f="s/Sardinha:Alberto" pid="91/515">Alberto Sardinha</na></co>
<co c="0"><na f="s/Spaan:Matthijs_T=_J=" pid="27/6431">Matthijs T. J. Spaan</na></co>
<co c="1"><na f="t/Tripathi:Yogesh" pid="241/5607">Yogesh Tripathi</na></co>
<co c="0"><na f="v/Vaart:Pascal_R=_van_der" pid="374/3312">Pascal R. van der Vaart</na></co>
<co c="0"><na f="v/Vadocz:Viliam" pid="404/8762">Viliam Vadocz</na></co>
<co c="1"><na f="v/Vincent:Th=eacute=o" pid="365/5726">Th&#233;o Vincent</na></co>
<co c="0"><na f="v/Vries:Joery_A=_de" pid="286/5559">Joery A. de Vries</na></co>
<co c="0"><na f="w/Weerdt:Mathijs_de" pid="91/3015">Mathijs de Weerdt</na></co>
<co c="0"><na f="w/Weltevrede:Max" pid="349/0201">Max Weltevrede</na></co>
<co c="0"><na f="z/Zanger:Moritz_A=" pid="290/1950">Moritz A. Zanger</na></co>
</coauthors>
</dblpperson>

