Scaling Up Average Reward Reinforcement Learning by Approximating the Domain Models and the Value Function
From Tetherless World Wiki
\begin{bibtex} @inproceedings{DBLP:conf/icml/TadepalliO96,
  author    = {Tadepalli, Prasad and
               Ok, DoKyeong},
  title     = {Scaling Up Average Reward Reinforcement Learning by Approximating the Domain Models and the Value Function},
  booktitle = {{ICML}},
  year      = {1996},
  pages     = {471--479},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
\end{bibtex}
