@COMMENT This file was generated by bib2html.pl <http://www.cs.cmu.edu/~pfr/misc_software/index.html#bib2html> version 0.90
@COMMENT written by Patrick Riley <http://www.cs.cmu.edu/~pfr>
@COMMENT This file came from Peter Stone's publication pages at
@COMMENT http://www.cs.utexas.edu/~pstone/papers
@InProceedings{ICDL10-hester,
	author="Todd Hester and Peter Stone",
	title="Real Time Targeted Exploration in Large Domains",
	booktitle = "The Ninth International Conference on Development and Learning (ICDL)",
	location = "Ann Arbor, Michigan",
	month = "August",
	year = "2010",
	abstract = "A developing agent needs to explore to learn about
		the world and learn good behaviors. In many real world tasks,
		this exploration can take far too long, and the agent must make
		decisions about which states to explore, and which states not
		to explore. Bayesian methods attempt to address this problem,
		but take too much computation time to run in reasonably sized
		domains. In this paper, we present TEXPLORE, the first algorithm
		to perform targeted exploration in real time in large domains.
		The algorithm learns multiple possible models of the domain
		that generalize action effects across states. We experiment with
		possible ways of adding intrinsic motivation to the agent to drive
		exploration. TEXPLORE is fully implemented and tested in a novel
		domain called Fuel World that is designed to reflect the type of
		targeted exploration needed in the real world. We show that
		our algorithm significantly outperforms representative examples
		of both model-free and model-based RL algorithms from the
		literature and is able to quickly learn to perform well in a large
		world in real-time.",
	wwwnote={<a href="http://www.eecs.umich.edu/icdl-2010/">ICDL 2010</a>},
}
