@inproceedings{6cd36f1433e64ec4b00d5c667392e460,
title = "The Variance-Penalized Stochastic Shortest Path Problem",
abstract = "The stochastic shortest path problem (SSPP) asks to resolve the non-deterministic choices in a Markov decision process (MDP) such that the expected accumulated weight before reaching a target state is maximized. This paper addresses the optimization of the variance-penalized expectation (VPE) of the accumulated weight, which is a variant of the SSPP in which a multiple of the variance of accumulated weights is incurred as a penalty. It is shown that the optimal VPE in MDPs with non-negative weights as well as an optimal deterministic finite-memory scheduler can be computed in exponential space. The threshold problem whether the maximal VPE exceeds a given rational is shown to be EXPTIME-hard and to lie in NEXPTIME. Furthermore, a result of interest in its own right obtained on the way is that a variance-minimal scheduler among all expectation-optimal schedulers can be computed in polynomial time.",
keywords = "Markov decision process, stochastic shortest path problem, variance",
author = "Jakob Piribauer and Ocan Sankur and Christel Baier",
note = "Publisher Copyright: {\textcopyright} Jakob Piribauer, Ocan Sankur, and Christel Baier; licensed under Creative Commons License CC-BY 4.0; 49th EATCS International Conference on Automata, Languages, and Programming, ICALP 2022 ; Conference date: 04-07-2022 Through 08-07-2022",
year = "2022",
month = jul,
day = "1",
doi = "10.4230/LIPIcs.ICALP.2022.129",
language = "English",
series = "Leibniz International Proceedings in Informatics, LIPIcs",
publisher = "Schloss Dagstuhl- Leibniz-Zentrum fur Informatik GmbH, Dagstuhl Publishing",
editor = "Mikolaj Bojanczyk and Emanuela Merelli and Woodruff, {David P.}",
booktitle = "49th EATCS International Conference on Automata, Languages, and Programming, ICALP 2022",
}