% Matsubara, Morimura, Morimoto (2010): "Adaptive Step-size Policy Gradients
% with Average Reward Metric", JMLR Proceedings Track, volume 13, pages 285--298.
% Entry originally exported from DBLP (see bibsource); the DBLP-specific "ee"
% link field is stored as "url" so that standard styles can print it.
@article{DBLP:journals/jmlr/MatsubaraMM10,
  author    = {Matsubara, Takamitsu and
               Morimura, Tetsuro and
               Morimoto, Jun},
  title     = {Adaptive Step-size Policy Gradients with Average Reward Metric},
  journal   = {Journal of Machine Learning Research - Proceedings Track},
  volume    = {13},
  pages     = {285--298},
  year      = {2010},
  url       = {http://www.jmlr.org/proceedings/papers/v13/matsubara10a.html},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}