
% ref1: journal article by Speekenbrink and Konstantinidis (2015) on a restless bandit task.
% The DOI is the canonical identifier; the url field is the same DOI in resolver form.
@article{ref1,
  author   = {Speekenbrink, Maarten and Konstantinidis, Emmanouil},
  title    = {Uncertainty and exploration in a restless bandit problem},
  journal  = {Topics in Cognitive Science},
  year     = {2015},
  volume   = {7},
  number   = {2},
  pages    = {351--367},
  issn     = {1756-8765},
  doi      = {10.1111/tops.12145},
  url      = {https://doi.org/10.1111/tops.12145},
  language = {en},
  abstract = {Decision making in noisy and changing environments requires a fine balance between exploiting knowledge about good courses of action and exploring the environment in order to improve upon this knowledge. We present an experiment on a restless bandit task in which participants made repeated choices between options for which the average rewards changed over time. Comparing a number of computational models of participants' behavior in this task, we find evidence that a substantial number of them balanced exploration and exploitation by considering the probability that an option offers the maximum reward out of all the available options.},
}