@inproceedings{fb786f7af8494c708c87a146258c7bd2,
title = "Death and suicide in universal artificial intelligence",
abstract = "Reinforcement learning (RL) is a general paradigm for studying intelligent behaviour, with applications ranging from artificial intelligence to psychology and economics. AIXI is a universal solution to the RL problem; it can learn any computable environment. A technical subtlety of AIXI is that it is defined using a mixture over semimeasures that need not sum to 1, rather than over proper probability measures. In this work we argue that the shortfall of a semimeasure can naturally be interpreted as the agent{\textquoteright}s estimate of the probability of its death. We formally define death for generally intelligent agents like AIXI, and prove a number of related theorems about their behaviour. Notable discoveries include that agent behaviour can change radically under positive linear transformations of the reward signal (from suicidal to dogmatically self-preserving), and that the agent{\textquoteright}s posterior belief that it will survive increases over time.",
author = "Jarryd Martin and Tom Everitt and Marcus Hutter",
note = "Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2016.; 9th International Conference on Artificial General Intelligence, AGI 2016 ; Conference date: 16-07-2016 Through 19-07-2016",
year = "2016",
doi = "10.1007/978-3-319-41649-6_3",
language = "English",
isbn = "9783319416489",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "23--32",
editor = "Bas Steunebrink and Pei Wang and Ben Goertzel",
booktitle = "Artificial General Intelligence - 9th International Conference, AGI 2016, Proceedings",
address = "Germany",
}