% JMLR volume 13, paper 103: Dynamic Policy Programming (Azar, Gomez, Kappen).
% Accented characters in the second author's name are written as BibTeX
% special characters so sorting and labels work under classic BibTeX.
@article{13:103,
  author  = {Azar, Mohammad Gheshlaghi and G{\'o}mez, Vicen{\c{c}} and Kappen, Hilbert J.},
  title   = {Dynamic Policy Programming},
  journal = {Journal of Machine Learning Research},
  year    = {2012},
  volume  = {13},
  number  = {103},
  url     = {http://www.jmlr.org/papers/volume13/azar12a/azar12a.pdf},
}