We consider the problem of optimally assigning p sniffers to K
channels to monitor the transmission activities in a multi-channel wireless
network. The activity of users is initially unknown to the sniffers and is to
be learned along with channel assignment decisions while maximizing the benifits of this assignment,
resulting in the fundamental trade-off between exploration versus exploitation. We formulate it as the
linear partial monitoring problem, a super-class of multi-armed bandits. As the number of
arms (sniffer-channel assignments) is exponential, novel techniques are called for, to allow efficient learning.
We use the linear bandit model to capture the dependency amongst the arms and develop two policies that take advantage of this dependency.
Both policies enjoy logarithmic regret bound of time-slots with a term that is sub-linear in the number of
arms.
%0 Conference Paper
%1 PaZheSze11
%A Pallavi, A.
%A Zheng, R.
%A Szepesvári, Cs.
%B INFOCOM
%D 2011
%K bandits bandits, networking, networks, stochastic theory, wireless
%P 1152--1160
%T Sequential Learning for Optimal Monitoring of Multi-channel Wireless Networks
%X We consider the problem of optimally assigning p sniffers to K
channels to monitor the transmission activities in a multi-channel wireless
network. The activity of users is initially unknown to the sniffers and is to
be learned along with channel assignment decisions while maximizing the benifits of this assignment,
resulting in the fundamental trade-off between exploration versus exploitation. We formulate it as the
linear partial monitoring problem, a super-class of multi-armed bandits. As the number of
arms (sniffer-channel assignments) is exponential, novel techniques are called for, to allow efficient learning.
We use the linear bandit model to capture the dependency amongst the arms and develop two policies that take advantage of this dependency.
Both policies enjoy logarithmic regret bound of time-slots with a term that is sub-linear in the number of
arms.
@inproceedings{PaZheSze11,
abstract = {We consider the problem of optimally assigning p sniffers to K
channels to monitor the transmission activities in a multi-channel wireless
network. The activity of users is initially unknown to the sniffers and is to
be learned along with channel assignment decisions while maximizing the benifits of this assignment,
resulting in the fundamental trade-off between exploration versus exploitation. We formulate it as the
linear partial monitoring problem, a super-class of multi-armed bandits. As the number of
arms (sniffer-channel assignments) is exponential, novel techniques are called for, to allow efficient learning.
We use the linear bandit model to capture the dependency amongst the arms and develop two policies that take advantage of this dependency.
Both policies enjoy logarithmic regret bound of time-slots with a term that is sub-linear in the number of
arms.},
added-at = {2020-03-17T03:03:01.000+0100},
author = {Pallavi, A. and Zheng, R. and Szepesv{\'a}ri, {Cs}.},
biburl = {https://www.bibsonomy.org/bibtex/201b1d2e8494fc2fb780ea9b38d63e871/csaba},
booktitle = {INFOCOM},
date-added = {2010-11-25 01:20:01 -0700},
date-modified = {2012-06-03 14:12:25 -0600},
interhash = {70052ad99da7e16f7a5c381ca7b29a68},
intrahash = {01b1d2e8494fc2fb780ea9b38d63e871},
keywords = {bandits bandits, networking, networks, stochastic theory, wireless},
month = {April},
pages = {1152--1160},
pdf = {papers/infocom11_final.pdf},
timestamp = {2020-03-17T03:03:01.000+0100},
title = {Sequential Learning for Optimal Monitoring of Multi-channel Wireless Networks},
year = 2011
}