@inproceedings{ce3a34ab46714e8e85f5d60b28ed021d,
title = "Reinforcement Learning with Guarantees that Hold for Ever",
abstract = "Reinforcement learning is a successful explore-and-exploit approach, where a controller tries to learn how to navigate an unknown environment. The principle approach is for an intelligent agent to learn how to maximise expected rewards. But what happens if the objective refers to non-terminating systems? We can obviously not wait until an infinite amount of time has passed, assess the success, and update. But what can we do? This talk will tell.",
keywords = "2023 OA procedure",
author = "Hahn, {Ernst Moritz} and Mateo Perez and Sven Schewe and Fabio Somenzi and Ashutosh Trivedi and Dominik Wojtczak",
year = "2022",
month = sep,
day = "5",
doi = "10.1007/978-3-031-15008-1_1",
language = "English",
isbn = "978-3-031-15007-4",
series = "Lecture Notes in Computer Science",
publisher = "Springer",
pages = "3--7",
editor = "Groote, {Jan Friso} and Marieke Huisman",
booktitle = "Formal Methods for Industrial Critical Systems",
address = "Germany",
}