% Conference paper by Hristov, Bosman, Bhulai and Van Der Mei (VALUETOOLS 2020,
% ACM International Conference Proceeding Series), pages 41--47.
% - "Markov" is brace-protected in the title so that styles which apply
%   sentence casing do not lowercase the proper noun.
% - All authors use the unambiguous "Last, First" form; the multi-word surname
%   "Van Der Mei" stays braced so it is treated as a single unit.
% - The citation key is left as exported so existing citations keep resolving.
@inproceedings{09aa0ca5418b4b328734a53299272af8,
  title     = {Deriving Explicit Control Policies for {Markov} Decision Processes Using Symbolic Regression},
  abstract  = {In this paper, we introduce a novel approach to optimizing the control of systems that can be modeled as Markov decision processes (MDPs) with a threshold-based optimal policy. Our method is based on a specific type of genetic program known as symbolic regression (SR). We present how the performance of this program can be greatly improved by taking into account the corresponding MDP framework in which we apply it. The proposed method has two main advantages: (1) it results in near-optimal decision policies, and (2) in contrast to other algorithms, it generates closed-form approximations. Obtaining an explicit expression for the decision policy gives the opportunity to conduct sensitivity analysis, and allows instant calculation of a new threshold function for any change in the parameters. We emphasize that the introduced technique is highly general and applicable to MDPs that have a threshold-based policy. Extensive experimentation demonstrates the usefulness of the method.},
  keywords  = {Closed-form approximation, Genetic program, Markov Decision Processes, Optimal control, Symbolic regression, Threshold-Type policy},
  author    = {Hristov, A. and Bosman, {J. W.} and Bhulai, S. and {Van Der Mei}, {R. D.}},
  year      = {2020},
  month     = may,
  doi       = {10.1145/3388831.3388840},
  language  = {English},
  series    = {ACM International Conference Proceeding Series},
  publisher = {Association for Computing Machinery},
  pages     = {41--47},
  booktitle = {{VALUETOOLS} '20},
  note      = {13th EAI International Conference on Performance Evaluation Methodologies and Tools, VALUETOOLS 2020 ; Conference date: 18-05-2020 Through 20-05-2020},
}