<?xml version="1.0" encoding="UTF-8"?>
<!--
  Bibliographic export containing a single journal-article record
  (key: journals/ml/SinghJLS00). Whitespace between the child elements of
  <dblp> and <article> is indentation only; leaf element text is data and
  is kept exactly as recorded.
-->
<dblp>
  <article key="journals/ml/SinghJLS00" mdate="2011-05-26">
    <!-- Repeated <author> elements, one per author, in recorded order. -->
    <author>Satinder P. Singh</author>
    <author>Tommi Jaakkola</author>
    <author>Michael L. Littman</author>
    <!-- Numeric character reference kept so the file stays ASCII-only. -->
    <author>Csaba Szepesv&#225;ri</author>
    <title>Convergence Results for Single-Step On-Policy Reinforcement-Learning Algorithms.</title>
    <pages>287-308</pages>
    <year>2000</year>
    <volume>38</volume>
    <journal>Machine Learning</journal>
    <number>3</number>
    <url>db/journals/ml/ml38.html#SinghJLS00</url>
    <ee>http://dx.doi.org/10.1023/A:1007678930559</ee>
  </article>
</dblp>
