Reinforcement Learning: Publications
Click here to download all publications in a single BibTeX file.
% Book chapter (chapter 5, pp. 82-96) by Hoffman and de Freitas in a 2012 volume edited by Sucar, Morales and Hoey.
% NOTE(review): a chapter in an edited volume is normally typed as incollection with a booktitle field;
% the book title is not recorded in this entry, so the entry type is left unchanged - TODO confirm and add.
@inbook{Hoffman:2012,
  author    = {Hoffman, Matthew and de Freitas, Nando},
  title     = {Inference Strategies for Solving Semi-{Markov} Decision Processes},
  editor    = {Sucar, Enrique and Morales, Eduardo F. and Hoey, Jesse},
  chapter   = {5},
  pages     = {82--96},
  publisher = {IGI Global},
  address   = {Hershey},
  year      = {2012},
  url       = {http://mlg.eng.cam.ac.uk/hoffmanm/publications/_download/2010-smdp.pdf},
}
% Paper in the JMLR proceedings track for AISTATS, volume 5 (2009), on an EM algorithm for continuous MDPs.
@article{Hoffman:2009b,
  author  = {Hoffman, Matthew and de Freitas, Nando and Doucet, Arnaud and Peters, Jan},
  title   = {An Expectation Maximization Algorithm for Continuous {Markov} Decision Processes with Arbitrary Reward},
  journal = {Journal of Machine Learning Research - Proceedings Track for Artificial Intelligence and Statistics (AISTATS)},
  volume  = {5},
  pages   = {232--239},
  year    = {2009},
  url     = {http://jmlr.org/proceedings/papers/v5/hoffman09a.html},
}
% Journal article in Autonomous Robots 27(2), 2009, on Bayesian exploration-exploitation for robot sensing and planning.
@article{Cantin:2009,
  author    = {Martinez-Cantin, Ruben and de Freitas, Nando and Brochu, Eric and Castellanos, Jos{\'e} and Doucet, Arnaud},
  title     = {A {Bayesian} exploration-exploitation approach for optimal online sensing and planning with a visually guided mobile robot},
  journal   = {Autonomous Robots},
  volume    = {27},
  number    = {2},
  pages     = {93--103},
  year      = {2009},
  publisher = {Springer US},
  issn      = {0929-5593},
  doi       = {10.1007/s10514-009-9130-2},
  url       = {http://dx.doi.org/10.1007/s10514-009-9130-2},
}
% Conference paper (UAI, 2009) on reversible jump MCMC inference strategies for Markov decision processes.
% First author's given name is spelled Matthew, matching the other Hoffman entries in this file.
@inproceedings{Hoffman:2009,
  author    = {Hoffman, Matthew and Kueck, Hendrik and de Freitas, Nando and Doucet, Arnaud},
  title     = {New inference strategies for solving {Markov} Decision Processes using reversible jump {MCMC}},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages     = {223--231},
  address   = {Corvallis, Oregon},
  year      = {2009},
  url       = {http://uai.sis.pitt.edu/displayArticleDetails.jsp?mmnu=2&smnu=2&article_id=1658&author_id=4},
}
% Chapter in Pattern Recognition and Image Analysis (Lecture Notes in Computer Science, volume 5524), 2009.
@incollection{Kueck:2009,
  author    = {Kueck, Hendrik and Hoffman, Matt and Doucet, Arnaud and de Freitas, Nando},
  title     = {Inference and Learning for Active Sensing, Experimental Design and Control},
  booktitle = {Pattern Recognition and Image Analysis},
  editor    = {Araujo, Helder and Mendonca, Ana Maria and Pinho, Armando J. and Torres, Maria Ines},
  series    = {Lecture Notes in Computer Science},
  volume    = {5524},
  pages     = {1--10},
  publisher = {Springer Berlin Heidelberg},
  year      = {2009},
  isbn      = {978-3-642-02171-8},
  doi       = {10.1007/978-3-642-02172-5_1},
  url       = {http://dx.doi.org/10.1007/978-3-642-02172-5_1},
}
% Conference paper (ICRA, 2008) on sequential decision-making for gaze planning.
@inproceedings{Vogel:2008,
  author    = {Vogel, J. and de Freitas, N.},
  title     = {Target-directed attention: Sequential decision-making for gaze planning},
  booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
  pages     = {2372--2379},
  year      = {2008},
  issn      = {1050-4729},
  doi       = {10.1109/ROBOT.2008.4543568},
  keywords  = {Bayes methods;decision making;planning (artificial intelligence);robot vision;bottom-up attention system;bottom-up saliency information;context information;direct policy search;featural visual saliency;finite-horizon Bayesian sequential decision process;gaze planning;gaze sequence;next best gaze location;object detection precision;probabilistic system;sequential decision making;target-directed attention system;top-down target knowledge;visual search;Bayesian methods;Cameras;Decision making;Detectors;Image analysis;Laboratories;Object detection;Robot vision systems;Robotics and automation;USA Councils},
}
% Paper in Advances in Neural Information Processing Systems 20 on Bayesian policy learning with trans-dimensional MCMC.
% Editor initials are written with a space between them so name parsing keeps every initial.
@incollection{Hoffman:2007,
  author    = {Hoffman, Matthew and Doucet, Arnaud and de Freitas, Nando and Jasra, Ajay},
  title     = {Bayesian Policy Learning with Trans-Dimensional {MCMC}},
  booktitle = {Advances in Neural Information Processing Systems 20},
  editor    = {Platt, J. C. and Koller, D. and Singer, Y. and Roweis, S.},
  pages     = {665--672},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  year      = {2007},
  url       = {http://nips.cc/Conferences/2007/Program/event.php?ID=663},
}
% Conference paper (American Control Conference, 2003) on particle filters for industrial process estimation and control.
@inproceedings{Menendez:2003,
  author    = {Morales-Menendez, R. and de Freitas, N. and Poole, D.},
  title     = {Estimation and control of industrial processes with particle filters},
  booktitle = {American Control Conference},
  volume    = {1},
  pages     = {579--584},
  year      = {2003},
  issn      = {0743-1619},
  doi       = {10.1109/ACC.2003.1239081},
  url       = {http://www.cs.ubc.ca/~nando/papers/itesmpaper.pdf},
}