{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,8,10]],"date-time":"2024-08-10T05:16:48Z","timestamp":1723267008318},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2014,12,28]],"date-time":"2014-12-28T00:00:00Z","timestamp":1419724800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Computing"],"published-print":{"date-parts":[[2015,11]]},"DOI":"10.1007\/s00607-014-0438-1","type":"journal-article","created":{"date-parts":[[2014,12,27]],"date-time":"2014-12-27T06:20:48Z","timestamp":1419661248000},"page":"1045-1075","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":34,"title":["Application of reinforcement learning to wireless sensor networks: models and algorithms"],"prefix":"10.1007","volume":"97","author":[{"given":"Kok-Lim Alvin","family":"Yau","sequence":"first","affiliation":[]},{"given":"Hock Guan","family":"Goh","sequence":"additional","affiliation":[]},{"given":"David","family":"Chieng","sequence":"additional","affiliation":[]},{"given":"Kae Hsiang","family":"Kwong","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,12,28]]},"reference":[{"issue":"10","key":"438_CR1","doi-asserted-by":"crossref","first-page":"90","DOI":"10.1109\/MCOM.2011.6035821","volume":"49","author":"DS Ghataoura","year":"2011","unstructured":"Ghataoura DS, Mitchell JE, Matich GE (2011) Networking and application interface technology for wireless sensor network surveillance and monitoring. IEEE Comm Magazine 49(10):90\u201397","journal-title":"IEEE Comm Magazine"},{"key":"438_CR2","volume-title":"Reinforcement learning: an introduction","author":"RS Sutton","year":"1998","unstructured":"Sutton RS, Barto AG (1998) Reinforcement learning: an introduction. MIT Press, Cambridge"},{"key":"438_CR3","doi-asserted-by":"crossref","unstructured":"Zhang D, Ma H (2007) A Q-learning-based decision making scheme for application reconfiguration in sensor networks. CSCWD\u201907 proc 11th Intl Conf Comp Supported Cooperative Work in Design. IEEE, Melbourne, Australia, pp 1122\u20131127","DOI":"10.1109\/CSCWD.2007.4281598"},{"key":"438_CR4","doi-asserted-by":"crossref","unstructured":"Seah MWS, Tham CK, Srinivasan V, Xin A (2007) Achieving coverage through distributed reinforcement learning in wireless sensor networks. ISSNIP\u201907 proc 3rd Intl Conf Intell Sensors, Sensor Net and Info. IEEE, Melbourne, Australia, pp 425\u2013430","DOI":"10.1109\/ISSNIP.2007.4496881"},{"key":"438_CR5","doi-asserted-by":"crossref","unstructured":"Dong S, Agrawal P, Sivalingam K (2007) Reinforcement learning based geographic routing protocol for UWB wireless sensor network. GLOBECOM\u201907 proc Global Telecomm Conf. IEEE, Washington, DC, pp 652\u2013656","DOI":"10.1109\/GLOCOM.2007.127"},{"issue":"1","key":"438_CR6","doi-asserted-by":"crossref","first-page":"253","DOI":"10.1016\/j.jnca.2011.08.007","volume":"35","author":"K-LA Yau","year":"2012","unstructured":"Yau K-LA, Komisarczuk P, Teal PD (2012) Reinforcement learning for context awareness and intelligence in wireless networks. Elsevier J Net Comp App 35(1):253\u2013267","journal-title":"Elsevier J Net Comp App"},{"key":"438_CR7","doi-asserted-by":"crossref","unstructured":"Chu Y, Mitchell PD, Grace D (2012) Reinforcement learning based ALOHA for multi-hop wireless sensor networks with informed receiving. WSS\u201912 proc IET Conf Wls Sensor Sys. IEEE, London, UK, pp 1\u20136","DOI":"10.1049\/cp.2012.0582"},{"issue":"3\/4","key":"438_CR8","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1504\/IJSNET.2006.012027","volume":"1","author":"Z Liu","year":"2006","unstructured":"Liu Z, Elhanany I (2006) RL-MAC: a reinforcement learning based MAC protocol for wireless sensor networks. Inderscience Intl J Sensor Net 1(3\/4):117\u2013124","journal-title":"Inderscience Intl J Sensor Net"},{"key":"438_CR9","unstructured":"Mao J, Xiang F, Lai H (2009) RL-based superframe order adaptation algorithm for IEEE 802.15.4 networks. In: CCDC\u201909 proc Ch Ctrl and Decision Conf. IEEE, Guilin, China, pp 1\u20135"},{"issue":"7","key":"438_CR10","doi-asserted-by":"crossref","first-page":"1094","DOI":"10.1109\/JSAC.2010.100914","volume":"28","author":"J Gummeson","year":"2010","unstructured":"Gummeson J, Ganesan D, Corner MD, Shenoy P (2010) An adaptive link layer for heterogeneous multi-radio mobile sensor networks. IEEE J Sel Area Comm 28(7):1094\u20131104","journal-title":"IEEE J Sel Area Comm"},{"key":"438_CR11","doi-asserted-by":"crossref","unstructured":"Hsu RC, Liu CT, Wang KC, Lee WM (2009) QoS-aware power management for energy harvesting wireless sensor network utilizing reinforcement learning. CSE\u201909 proc Intl Conf Comp Sc and Engin. IEEE, Vancouver, Canada, pp 537\u2013542","DOI":"10.1109\/CSE.2009.83"},{"issue":"17","key":"438_CR12","doi-asserted-by":"crossref","first-page":"2094","DOI":"10.1016\/j.comcom.2011.06.010","volume":"34","author":"K Shah","year":"2011","unstructured":"Shah K, Francesco MD, Anastasi G, Kumar M (2011) A framework for resource-aware data accumulation in sparse wireless sensor networks. Elsevier J Comp Comm 34(17):2094\u20132103","journal-title":"Elsevier J Comp Comm"},{"issue":"2","key":"438_CR13","doi-asserted-by":"crossref","first-page":"98","DOI":"10.1504\/IJSNET.2010.034619","volume":"8","author":"X Liang","year":"2010","unstructured":"Liang X, Chen M, Xiao Y, Balasingham I, Leung VCM (2010) MRL-CC: a novel cooperative communication protocol for QoS provisioning in wireless sensor networks. Inderscience Intl J Sensor Net 8(2):98\u2013108","journal-title":"Inderscience Intl J Sensor Net"},{"key":"438_CR14","doi-asserted-by":"crossref","unstructured":"Forster A, Murphy AL (2009) Clique: role-free clustering with Q-learning for wireless sensor networks. ICDCS\u201909 proceedings 29th IEEE Intl Conf Dist Comp Sys. IEEE, Quebec, Canada, pp 441\u2013449","DOI":"10.1109\/ICDCS.2009.43"},{"key":"438_CR15","unstructured":"Saoseng JY, Tham CK (2006) Coordinated rate control in wireless sensor network. ICCS\u201906 proc 10 $$^{th}$$ t h IEEE Singapore Intl Conf Comm Sys. IEEE, Singapore, pp 1\u20135"},{"key":"438_CR16","unstructured":"Tan H, Zhao L, Liu W, Niu Y, Zhao C (2011) Adaptive congestion avoidance scheme based on reinforcement learning for wireless sensor network. ICCTA\u201911 proc IET Intl Conf Comm Tech and App. IEEE, Beijing, China, pp 228\u2013232"},{"key":"438_CR17","unstructured":"Tham CK, Renaud JC (2005) Multi-agent systems on sensor networks: a distributed reinforcement learning approach. ISSNIP\u201905 proc Intl Conf Intell Sensors, Sensor Net and Info. IEEE, Melbourne, Australia, pp 423\u2013429"},{"key":"438_CR18","unstructured":"Khan MI, Rinner B (2012) Resource coordination in wireless sensor networks by cooperative reinforcement learning. PERCOMW\u201912 proc IEEE Intl Conf Pervasive Comp and Comm Workshops. IEEE, Lugano, Switzerland, pp 895\u2013900"},{"key":"438_CR19","doi-asserted-by":"crossref","unstructured":"Mahadevan S (1994) To discount or not to discount in reinforcement learning: a case study comparing R learning and Q learning. ICML\u201994: Proceedings of the 11th International Conference on Machine Learning. Morgan Kaufmann, Amherst, MA, pp 164\u2013172","DOI":"10.1016\/B978-1-55860-335-6.50028-3"},{"key":"438_CR20","unstructured":"Mao S, Tang H, Zhou L, Ma X (2011) An energy conservation optimization strategy for wireless sensor network node based on Q-learning. ASCC\u201911 proc Asian Ctrl Conf. IEEE, Kaohsiung, Taiwan, pp 938\u2013943"},{"key":"438_CR21","doi-asserted-by":"crossref","unstructured":"Alberola RdP, Pesch D (2012) Duty cycle learning algorithm (DCLA) for IEEE 802.15.4 beacon-enabled wireless sensor networks. Elsevier Ad Hoc Net 10(4):664\u2013679","DOI":"10.1016\/j.adhoc.2011.06.006"},{"key":"438_CR22","doi-asserted-by":"crossref","unstructured":"Arroyo-Valles R, Alaiz-Rodriguez R, Guerrero-Curieses A, Cid-Sueiro J (2007) Q-probabilistic routing in wireless sensor networks. ISSNIP\u201907: Proc 3rd Intl Conf Intell Sensors, Sensor Net and Info. IEEE, Melbourne, Australia, pp 1\u20136","DOI":"10.1109\/ISSNIP.2007.4496810"},{"issue":"5","key":"438_CR23","doi-asserted-by":"crossref","first-page":"940","DOI":"10.1016\/j.adhoc.2010.11.006","volume":"9","author":"A Forster","year":"2011","unstructured":"Forster A, Murphy AL (2011) FROMS: a failure tolerant and mobility enabled multicast routing paradigm with reinforcement learning for WSNs. Elsevier Ad Hoc Net 9(5):940\u2013965","journal-title":"Elsevier Ad Hoc Net"},{"issue":"3","key":"438_CR24","doi-asserted-by":"crossref","first-page":"458","DOI":"10.1016\/j.adhoc.2011.07.015","volume":"10","author":"BC Villaverde","year":"2012","unstructured":"Villaverde BC, Rea S, Pesch D (2012) InRout: a QoS aware route selection algorithm for industrial wireless sensor networks. Elsevier Ad Hoc Net 10(3):458\u2013478","journal-title":"Elsevier Ad Hoc Net"},{"key":"438_CR25","doi-asserted-by":"crossref","unstructured":"Hu T, Fei Y (2012) MURAO: a multi-level routing protocol for acoustic-optical hybrid underwater wireless sensor networks. SECON\u201912 proc 9th Ann IEEE Comm Soc Conf Sensor, Mesh and Ad hoc Comm and Net. IEEE, Seoul, South Korea, pp 218\u2013226","DOI":"10.1109\/SECON.2012.6275781"},{"key":"438_CR26","unstructured":"Liang X, Balasingham I, Byun SS (2008) A multi-agent reinforcement learning based routing protocol for wireless sensor networks. ISWCS\u201908 proc IEEE Intl Symp on Wls Comm Sys. IEEE, Reykjavik, Iceland, pp 552\u2013557"},{"key":"438_CR27","unstructured":"Liang X, Balasingham I, Byun SS (2008) A reinforcement learning based routing protocol with QoS support for biomedical sensor networks. ISABEL\u201908 proc 1st Intl Symp App Sc and Biomedical and Comm Tech. IEEE, Aalborg, Denmark, pp 1\u20135"},{"key":"438_CR28","doi-asserted-by":"crossref","unstructured":"Naputta Y, Usaha W (2012) RL-based routing in biomedical mobile wireless sensor networks using trust and reputation. ISWCS\u201912 proc 9th Intl Symp Wls Comm Sys. IEEE, Paris, France, pp 521\u2013525","DOI":"10.1109\/ISWCS.2012.6328422"},{"key":"438_CR29","doi-asserted-by":"crossref","unstructured":"Chu Y, Mitchell PD, Grace D (2012) ALOHA and Q-learning based medium access control for wireless sensor networks. ISWCS\u201912 proc Intl Symp Wls Comm Sys. IEEE, Paris, France, pp 511\u2013515","DOI":"10.1109\/ISWCS.2012.6328420"},{"issue":"3\/4","key":"438_CR30","first-page":"207","volume":"9","author":"M Mihaylov","year":"2012","unstructured":"Mihaylov M, Borgne YAL, Tuyls K, Nowe A (2012) Decentralised reinforcement learning for energy-efficient scheduling in wireless sensor networks. Inderscience Intl J Comm Net Distrib Sys 9(3\/4):207\u2013224","journal-title":"Inderscience Intl J Comm Net Distrib Sys"},{"key":"438_CR31","doi-asserted-by":"crossref","unstructured":"Niu J, Deng Z (2013) Distributed self-learning scheduling approach for wireless sensor network. Elsevier Ad Hoc Net 11(4):1276\u20131286","DOI":"10.1016\/j.adhoc.2010.11.004"},{"key":"438_CR32","doi-asserted-by":"crossref","unstructured":"Liang X, Chen M, Leung VCM, Balasingham I (2010) Soft QoS provisioning for wireless sensor networks: a cooperative communications approach.In: CHINACOM\u201910: Proceedings of 5th Intl ICST Conf Commu and Net in China. IEEE, Beijing, China, pp 1\u20138","DOI":"10.4108\/chinacom.2010.113"},{"key":"438_CR33","doi-asserted-by":"crossref","unstructured":"Liang X, Balasingham I, Leung VCM (2009) Cooperative communications with relay selection for QoS provisioning in wireless sensor networks. GLOBECOM\u201909 proc Global Telecomm Conf. IEEE, Honolulu, Hawaii, pp 1\u20138","DOI":"10.1109\/GLOCOM.2009.5425437"},{"key":"438_CR34","doi-asserted-by":"crossref","unstructured":"Maalej M, Besbes H, Cherif S (2012) A cooperative communication protocol for saving energy consumption in WSNs. ComNet\u201912 proc Intl Conf Comm and Net. IEEE, Kunming, China, pp 1\u20135","DOI":"10.1109\/ComNet.2012.6217725"},{"key":"438_CR35","doi-asserted-by":"crossref","unstructured":"Renaud JC, Tham CK (2006) Coordinated sensing coverage in sensor networks using distributed reinforcement learning. ICON\u201906 proc 14th IEEE Intl Conf Net. IEEE, Singapore, pp 1\u20136","DOI":"10.1109\/ICON.2006.302580"},{"issue":"6","key":"438_CR36","doi-asserted-by":"crossref","first-page":"796","DOI":"10.1109\/TMC.2010.28","volume":"9","author":"T Hu","year":"2010","unstructured":"Hu T, Fei Y (2010) QELAR: a machine-learning-based adaptive routing protocol for energy-efficient and lifetime-extended underwater sensor networks. IEEE Trans Mob Comp 9(6):796\u2013809","journal-title":"IEEE Trans Mob Comp"},{"key":"438_CR37","doi-asserted-by":"crossref","unstructured":"Yau K-LA, Komisarczuk P, Teal PD (2011) Achieving context awareness and intelligence in distributed cognitive radio networks: a payoff propagation approach. In: WAINA\u201911 proc IEEE Workshops Intl Conf Ad Info Net and App. IEEE, Singapore","DOI":"10.1109\/WAINA.2011.47"}],"container-title":["Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00607-014-0438-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00607-014-0438-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00607-014-0438-1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,19]],"date-time":"2019-08-19T01:23:54Z","timestamp":1566177834000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00607-014-0438-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,12,28]]},"references-count":37,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2015,11]]}},"alternative-id":["438"],"URL":"https:\/\/doi.org\/10.1007\/s00607-014-0438-1","relation":{},"ISSN":["0010-485X","1436-5057"],"issn-type":[{"value":"0010-485X","type":"print"},{"value":"1436-5057","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,12,28]]}}}