We consider the problem of optimally assigning p sniffers to K channels to
monitor the transmission activities in a multi-channel wireless network with
switching costs. The activity of users is initially unknown to the sniffers and
is to be learned along with channel assignment decisions to maximize the
benefits of this assignment, resulting in the fundamental trade-off between
exploration and exploitation. Switching costs are incurred when sniffers change
their channel assignments. As a result, frequent changes are undesirable. We
formulate the sniffer-channel assignment with switching costs as a linear
partial monitoring problem, a super-class of multi-armed bandits. As the number
of arms (sniffer-channel assignments) is exponential, novel techniques are
called for, to allow efficient learning. We use the linear bandit model to
capture the dependency amongst the arms and develop a policy that takes
advantage of this dependency. We prove the proposed Upper Confident Bound-based
(UCB) policy enjoys a logarithmic regret bound in time t that depends
sub-linearly on the number of arms, while its total switching cost grows with log(log(t)).
%0 Journal Article
%1 LeSzeZh14
%A Le, T.
%A Zheng, R.
%A Szepesvári, Cs.
%D 2014
%J IEEE Transactions on Signal Processing
%K area bandits bandits, local monitoring, network networking, networks, stochastic theory, wireless
%P 5919--5929
%T Sequential Learning for Multi-channel Wireless Network Monitoring with Channel Switching Costs
%V 62
%X We consider the problem of optimally assigning p sniffers to K channels to
monitor the transmission activities in a multi-channel wireless network with
switching costs. The activity of users is initially unknown to the sniffers and
is to be learned along with channel assignment decisions to maximize the
benefits of this assignment, resulting in the fundamental trade-off between
exploration and exploitation. Switching costs are incurred when sniffers change
their channel assignments. As a result, frequent changes are undesirable. We
formulate the sniffer-channel assignment with switching costs as a linear
partial monitoring problem, a super-class of multi-armed bandits. As the number
of arms (sniffer-channel assignments) is exponential, novel techniques are
called for, to allow efficient learning. We use the linear bandit model to
capture the dependency amongst the arms and develop a policy that takes
advantage of this dependency. We prove the proposed Upper Confident Bound-based
(UCB) policy enjoys a logarithmic regret bound in time t that depends
sub-linearly on the number of arms, while its total switching cost grows with log(log(t)).
@article{LeSzeZh14,
abstract = {We consider the problem of optimally assigning p sniffers to K channels to
monitor the transmission activities in a multi-channel wireless network with
switching costs. The activity of users is initially unknown to the sniffers and
is to be learned along with channel assignment decisions to maximize the
benefits of this assignment, resulting in the fundamental trade-off between
exploration and exploitation. Switching costs are incurred when sniffers change
their channel assignments. As a result, frequent changes are undesirable. We
formulate the sniffer-channel assignment with switching costs as a linear
partial monitoring problem, a super-class of multi-armed bandits. As the number
of arms (sniffer-channel assignments) is exponential, novel techniques are
called for, to allow efficient learning. We use the linear bandit model to
capture the dependency amongst the arms and develop a policy that takes
advantage of this dependency. We prove the proposed Upper Confident Bound-based
(UCB) policy enjoys a logarithmic regret bound in time t that depends
sub-linearly on the number of arms, while its total switching cost grows with log(log(t)).},
added-at = {2020-03-17T03:03:01.000+0100},
author = {Le, T. and Zheng, R. and Szepesv{\'a}ri, {Cs}.},
bdsk-url-1 = {http://www.azn.nl/rrng/xray/digmam/iwdm98},
biburl = {https://www.bibsonomy.org/bibtex/2ada18ba1950ced06da373a5ca360efaa/csaba},
date-added = {2014-09-07 09:25:42 -0600},
date-modified = {2014-12-06 19:50:07 +0000},
interhash = {8faa46df6c75ef64b982eb2042e112dc},
intrahash = {ada18ba1950ced06da373a5ca360efaa},
journal = {IEEE Transactions on Signal Processing},
keywords = {area bandits bandits, local monitoring, network networking, networks, stochastic theory, wireless},
month = {September},
pages = {5919--5929},
pdf = {papers/zheng-tsp2014.pdf},
timestamp = {2020-03-17T03:03:01.000+0100},
title = {Sequential Learning for Multi-channel Wireless Network Monitoring with Channel Switching Costs},
volume = 62,
year = 2014
}