% Publication records for T. Zhao and co-authors on policy-gradient
% reinforcement learning: journal articles, technical reports and
% conference papers, followed by the doctoral thesis.
%
% Citation keys are kept exactly as they were so that existing citations
% continue to resolve. Given names are stored as initials because that is
% all the original records provide.

% ---------------------------------------------------------------------
% Journal articles
% ---------------------------------------------------------------------

@article{CTT100660173,
  author  = {Zhao, T. and Hachiya, H. and Tangkaratt, V. and Morimoto, J. and Sugiyama, M.},
  title   = {Efficient sample reuse in policy gradients with parameter-based exploration},
  journal = {Neural Computation},
  year    = {2013},
}

@article{CTT100660280,
  author  = {Zhao, T. and Hachiya, H. and Niu, G. and Sugiyama, M.},
  title   = {Analysis and improvement of policy gradient estimation},
  journal = {Neural Networks},
  year    = {2012},
}

% ---------------------------------------------------------------------
% Technical reports and conference papers
% ---------------------------------------------------------------------

@inproceedings{CTT100660114,
  author    = {Mori, S. and Tangkaratt, V. and Zhao, T. and Morimoto, J. and Sugiyama, M.},
  title     = {Model-based policy gradients with parameter-based exploration by least-squares conditional density estimation},
  booktitle = {{IEICE} Technical Report},
  year      = {2013},
}

@inproceedings{CTT100634727,
  author    = {Zhao, T. and Hachiya, H. and Sugiyama, M.},
  title     = {Importance-weighted policy gradients with parameter-based exploration},
  booktitle = {{IEICE} Technical Report, {IBISML2011-95}},
  year      = {2012},
}

@inproceedings{CTT100633501,
  author    = {Zhao, T. and Hachiya, H. and Niu, G. and Sugiyama, M.},
  title     = {Analysis and improvement of policy gradient estimation},
  booktitle = {{IEICE} Technical Report, {IBISML2011-12}},
  year      = {2012},
}

% NOTE(review): the original record carries an empty booktitle, so the venue
% is unknown here. The field is left empty on purpose instead of guessing;
% fill it in once the venue has been confirmed.
@inproceedings{CTT100660130,
  author    = {Zhao, T. and Hachiya, H. and Sugiyama, M.},
  title     = {Efficient data reuse in robot control learning via importance sampling},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100633484,
  author    = {Zhao, T. and Hachiya, H. and Niu, G. and Sugiyama, M.},
  title     = {Analysis and improvement of policy gradient estimation},
  booktitle = {Advances in Neural Information Processing Systems 24},
  year      = {2011},
}

% ---------------------------------------------------------------------
% Doctoral thesis
% ---------------------------------------------------------------------
% Each key below used to be defined twice: once as a misc record and once as
% a phdthesis record. Repeated keys make BibTeX report an error and discard
% the later definition, so only the more complete phdthesis records (which
% add the school) are kept. The three keys describe the same thesis; all of
% them are retained so that no existing citation breaks.
% NOTE(review): the school name is stored in UTF-8 as found; confirm the
% toolchain in use handles non-ASCII field values.

@phdthesis{CTT100687281,
  author = {Zhao, Tingting},
  title  = {Statistical Theory of Reinforcement Learning with Applications to Robot Control},
  school = {東京工業大学},
  year   = {2014},
}

@phdthesis{CTT100666783,
  author = {Zhao, Tingting},
  title  = {Statistical Theory of Reinforcement Learning with Applications to Robot Control},
  school = {東京工業大学},
  year   = {2014},
}

@phdthesis{CTT100687140,
  author = {Zhao, Tingting},
  title  = {Statistical Theory of Reinforcement Learning with Applications to Robot Control},
  school = {東京工業大学},
  year   = {2014},
}