% Conference paper by Madhushani and Leonard, European Control Conference 2021.
% The citation key is kept exactly as it was so that existing citations resolve.
% The conference name lives in booktitle only; the conference dates are in note.
@inproceedings{18ab34db1277429eab652c646e1bfbd1,
  author    = {Madhushani, Udari and Leonard, Naomi Ehrich},
  title     = {Distributed Bandits: Probabilistic Communication on d-regular Graphs},
  booktitle = {2021 European Control Conference, ECC 2021},
  pages     = {830--835},
  year      = {2021},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  doi       = {10.23919/ECC54610.2021.9655031},
  language  = {English (US)},
  note      = {Publisher Copyright: {\textcopyright} 2021 EUCA. 2021 European Control Conference, ECC 2021. Conference date: 29-06-2021 through 02-07-2021},
  abstract  = {We study the decentralized multi-agent multi-armed bandit problem for agents that communicate with probability over a network defined by a d-regular graph. Every edge in the graph has probabilistic weight p to account for the (1 - p) probability of a communication link failure. At each time step, each agent chooses an arm and receives a numerical reward associated with the chosen arm. After each choice, each agent observes the last obtained reward of each of its neighbors with probability p. We propose a new Upper Confidence Bound (UCB) based algorithm and analyze how agent-based strategies contribute to minimizing group regret in this probabilistic communication setting. We provide theoretical guarantees that our algorithm outperforms state-of-the-art algorithms. We illustrate our results and validate the theoretical claims using numerical simulations.},
}