Scaling Model-Based Average-Reward Reinforcement Learning for Product Delivery
From Tetherless World Wiki
\begin{bibtex} @inproceedings{DBLP:conf/ecml/ProperT06,
  author    = {Proper, Scott and
               Tadepalli, Prasad},
  title     = {Scaling Model-Based Average-Reward Reinforcement Learning
               for Product Delivery},
  booktitle = {ECML},
  year      = {2006},
  pages     = {735--742},
  doi       = {10.1007/11871842_74},
  ee        = {http://dx.doi.org/10.1007/11871842_74},
  crossref  = {DBLP:conf/ecml/2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
\end{bibtex}
