The search for finite-state controllers for partially observable Markov decision processes (POMDPs) is often based on approaches like gradient ascent, attractive because of their relatively low computational cost. In this paper, we illustrate a basic problem with gradient-based methods applied to POMDPs, where the sequential nature of the decision problem is at issue, and propose a new stochastic local search method as an alternative.
%0 Conference Paper
%1 citeulike:126921
%A Braziunas, Darius
%A Boutilier, Craig
%D 2004
%K policy-iteration pomdp
%T Stochastic local search for POMDP controllers
%U http://citeseer.ist.psu.edu/braziunas04stochastic.html
%X The search for finite-state controllers for partially observable Markov decision processes (POMDPs) is often based on approaches like gradient ascent, attractive because of their relatively low computational cost. In this paper, we illustrate a basic problem with gradient-based methods applied to POMDPs, where the sequential nature of the decision problem is at issue, and propose a new stochastic local search method as an alternative.
@inproceedings{citeulike:126921,
  author               = {Braziunas, Darius and Boutilier, Craig},
  title                = {Stochastic Local Search for {POMDP} Controllers},
  booktitle            = {Proceedings of the Nineteenth National Conference on Artificial Intelligence ({AAAI}-04)},
  year                 = {2004},
  url                  = {http://citeseer.ist.psu.edu/braziunas04stochastic.html},
  abstract             = {The search for finite-state controllers for partially observable Markov decision processes (POMDPs) is often based on approaches like gradient ascent, attractive because of their relatively low computational cost. In this paper, we illustrate a basic problem with gradient-based methods applied to POMDPs, where the sequential nature of the decision problem is at issue, and propose a new stochastic local search method as an alternative.},
  keywords             = {policy-iteration pomdp},
  internal-note        = {Review: title acronym brace-protected so sentence-casing styles keep POMDP upper-case; booktitle (required for inproceedings) was added during review and should be confirmed against the published proceedings.},
  added-at             = {2006-04-12T20:53:54.000+0200},
  timestamp            = {2006-04-12T20:53:54.000+0200},
  biburl               = {https://www.bibsonomy.org/bibtex/2245734940e0ae9642001197722848fc8/darius},
  citeulike-article-id = {126921},
  description          = {CiteULike},
  interhash            = {dbef4f2252af0b21af490cf205024dd7},
  intrahash            = {245734940e0ae9642001197722848fc8},
  priority             = {0},
}