dc.contributor.author | Barry, Jennifer | |
dc.contributor.author | Kaelbling, Leslie P. | |
dc.contributor.author | Lozano-Perez, Tomas | |
dc.date.accessioned | 2011-03-03T19:04:22Z | |
dc.date.available | 2011-03-03T19:04:22Z | |
dc.date.issued | 2010-05 | |
dc.date.submitted | 2010-03 | |
dc.identifier.uri | http://hdl.handle.net/1721.1/61387 | |
dc.description.abstract | This paper presents an algorithm for finding approximately
optimal policies in very large Markov decision processes by
constructing a hierarchical model and then solving it. This
strategy sacrifices optimality for the ability to address a large
class of very large problems. Our algorithm works efficiently
on enumerated-states and factored MDPs by constructing a
hierarchical structure that is no larger than both the reduced
model of the MDP and the regression tree for the goal in that
MDP, and then using that structure to solve for a policy. | en_US |
dc.language.iso | en_US | |
dc.publisher | Association for the Advancement of Artificial Intelligence | en_US |
dc.relation.isversionof | http://digital.cs.usu.edu/~danbryce/icaps10/PSUWS/Accepted_Papers.html | en_US |
dc.rights | Attribution-Noncommercial-Share Alike 3.0 Unported | en_US |
dc.rights.uri | http://creativecommons.org/licenses/by-nc-sa/3.0/ | en_US |
dc.source | MIT web domain | en_US |
dc.title | Hierarchical Solution of Large Markov Decision Processes | en_US |
dc.type | Article | en_US |
dc.identifier.citation | Barry, Jennifer, Leslie Pack Kaelbling and Tomas Lozano-Perez. "Hierarchical Solution of Large Markov Decision Processes." ICAPS-10 Workshop on Planning and Scheduling Under Uncertainty, Toronto, Canada, May 12-16, 2010. | en_US |
dc.contributor.department | Massachusetts Institute of Technology. Department of Electrical Engineering and Computer Science | en_US |
dc.contributor.approver | Kaelbling, Leslie P. | |
dc.contributor.mitauthor | Barry, Jennifer | |
dc.contributor.mitauthor | Kaelbling, Leslie P. | |
dc.contributor.mitauthor | Lozano-Perez, Tomas | |
dc.relation.journal | ICAPS-10 Workshop on Planning and Scheduling Under Uncertainty, 2010 | en_US |
dc.eprint.version | Author's final manuscript | en_US |
dc.type.uri | http://purl.org/eprint/type/ConferencePaper | en_US |
eprint.status | http://purl.org/eprint/status/PeerReviewed | en_US |
dspace.orderedauthors | Barry, Jennifer; Kaelbling, Leslie Pack; Lozano-Perez, Tomas | |
dc.identifier.orcid | https://orcid.org/0000-0002-8657-2450 | |
dc.identifier.orcid | https://orcid.org/0000-0001-6054-7145 | |
dspace.mitauthor.error | true | |
mit.license | OPEN_ACCESS_POLICY | en_US |
mit.metadata.status | Complete | |