<?xml version="1.0" encoding="US-ASCII"?>
<dblp>
<article key="journals/nn/LiuLWHH26" mdate="2026-03-31">
<author orcid="0009-0002-7766-8802">Wenhui Liu</author>
<author orcid="0009-0002-0328-2026">Kangyang Luo</author>
<author orcid="0000-0002-3040-3287">Zhijian Wu</author>
<author orcid="0009-0005-5492-6727">Shanfeng Hao</author>
<author orcid="0000-0002-0144-7344">Dingjiang Huang</author>
<title>Mitigating OOD overoptimism via in-sample value function in offline reinforcement learning.</title>
<year>2026</year>
<pages>108763</pages>
<volume>200</volume>
<journal>Neural Networks</journal>
<ee>https://doi.org/10.1016/j.neunet.2026.108763</ee>
<url>db/journals/nn/nn200.html#LiuLWHH26</url>
<stream>streams/journals/nn</stream>
</article>
</dblp>
