{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,8,8]],"date-time":"2024-08-08T07:04:56Z","timestamp":1723100696222},"reference-count":28,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2013,8,10]],"date-time":"2013-08-10T00:00:00Z","timestamp":1376092800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Front. Comput. Sci."],"published-print":{"date-parts":[[2013,10]]},"DOI":"10.1007\/s11704-013-2291-3","type":"journal-article","created":{"date-parts":[[2013,8,9]],"date-time":"2013-08-09T20:45:06Z","timestamp":1376081106000},"page":"754-766","source":"Crossref","is-referenced-by-count":8,"title":["Reinforcement learning models for scheduling in wireless networks"],"prefix":"10.1007","volume":"7","author":[{"given":"Kok-Lim Alvin","family":"Yau","sequence":"first","affiliation":[]},{"given":"Kae Hsiang","family":"Kwong","sequence":"additional","affiliation":[]},{"given":"Chong","family":"Shen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,8,10]]},"reference":[{"key":"2291_CR1","volume-title":"Reinforcement learning: an introduction","author":"R S Sutton","year":"1998","unstructured":"Sutton R S, Barto A G. Reinforcement learning: an introduction. US: MIT Press, 1998"},{"issue":"1","key":"2291_CR2","doi-asserted-by":"crossref","first-page":"197","DOI":"10.1287\/opre.50.1.197.17783","volume":"50","author":"S J Stidham","year":"2002","unstructured":"Stidham S J. Applied probability in operations research: a retrospective\/\/Preprint: analysis, design, and control of queueing systems. Operation Research, 2002, 50(1): 197\u2013216","journal-title":"Operation Research"},{"issue":"7","key":"2291_CR3","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1109\/MCOM.2012.6231288","volume":"50","author":"M S Thompson","year":"2012","unstructured":"Thompson M S, Mackenzie A B, Dasilva L A, Hadjichristofi G. A mobile ad hoc networking competition: a retrospective look at the MANIAC challenge. IEEE Communications Magazine, 2012, 50(7): 121\u2013127","journal-title":"IEEE Communications Magazine"},{"issue":"7","key":"2291_CR4","doi-asserted-by":"crossref","first-page":"147","DOI":"10.1109\/MCOM.2012.6231291","volume":"50","author":"X Li","year":"2012","unstructured":"Li X, Falcon R, Nayak A, Stojmenovic I. Servicing wireless sensor networks by mobile robots. IEEE Communications Magazine, 2012, 50(7): 147\u2013154","journal-title":"IEEE Communications Magazine"},{"key":"2291_CR5","doi-asserted-by":"crossref","first-page":"2045","DOI":"10.1109\/WCNC.2008.363","volume-title":"Proceedings of the 2008 IEEE Wireless Communications and Networking Conference","author":"Y Xue","year":"2008","unstructured":"Xue Y, Lin Y, Cai H, Chi C. Autonomic joint session scheduling strategies for heterogeneous wireless networks. In: Proceedings of the 2008 IEEE Wireless Communications and Networking Conference. 2008, 2045\u20132050"},{"issue":"1","key":"2291_CR6","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1109\/MWC.2012.6155873","volume":"19","author":"M Song","year":"2012","unstructured":"Song M, Xin C, Zhao Y, Cheng X. Dynamic spectrum access: from cognitive radio to network radio. IEEE Wireless Communications, 2012, 19(1): 23\u201329","journal-title":"IEEE Wireless Communications"},{"key":"2291_CR7","first-page":"4708","volume-title":"Proceedings of the 2009 Chinese Control and Decision Conference","author":"J Mao","year":"2009","unstructured":"Mao J, Xiang F, Lai H. RL-based superframe order adaptation algorithm for IEEE 802.15.4 networks. In: Proceedings of the 2009 Chinese Control and Decision Conference. 2009, 4708\u20134711"},{"key":"2291_CR8","first-page":"1","volume-title":"Proceedings of the 4th International Conference on Mobile Ad-hoc and Sensor Systems","author":"K Shah","year":"2007","unstructured":"Shah K, Kumar M. Distributed independent reinforcement learning (DIRL) approach to resource management in wireless sensor networks. In: Proceedings of the 4th International Conference on Mobile Ad-hoc and Sensor Systems. 2007, 1\u20139"},{"key":"2291_CR9","first-page":"253","volume-title":"Proceedings of the 2010 International Conference on Future Computer and Communication","author":"J Niu","year":"2010","unstructured":"Niu J. Self-learning scheduling approach for wireless sensor network. In: Proceedings of the 2010 International Conference on Future Computer and Communication. 2010, 253\u2013257"},{"key":"2291_CR10","doi-asserted-by":"crossref","first-page":"237","DOI":"10.1613\/jair.301","volume":"4","author":"L P Kaelbling","year":"1996","unstructured":"Kaelbling L P, Littman M L, Wang X. Reinforcement learning: a survey. Journal of Artificial Intelligence Research, 1996, 4: 237\u2013285","journal-title":"Journal of Artificial Intelligence Research"},{"key":"2291_CR11","first-page":"392","volume-title":"Proceedings of the 9th International Conference on Innovations in Information Technology","author":"M Bourenane","year":"2011","unstructured":"Bourenane M. Adaptive scheduling in mobile ad hoc networks using reinforcement learning approach. In: Proceedings of the 9th International Conference on Innovations in Information Technology. 2011, 392\u2013397"},{"key":"2291_CR12","first-page":"1","volume-title":"Proceedings of the 2011 International Conference on Computer Communication Networks","author":"M D Felice","year":"2011","unstructured":"Felice M D, Chowdhury K R, Kassler A, Bononi L. Adaptive sensing scheduling and spectrum selection in cognitive wireless mesh networks. In: Proceedings of the 2011 International Conference on Computer Communication Networks. 2011, 1\u20136"},{"key":"2291_CR13","first-page":"140","volume-title":"Proceedings of the 20th Conference on Software, Telecomm, Computer Networks","author":"S Zouaidi","year":"2008","unstructured":"Zouaidi S, Mellouk A, Bourennane M, Hoceini S. Design and performance analysis of inductive QoS scheduling for dynamic network routing. In: Proceedings of the 20th Conference on Software, Telecomm, Computer Networks. 2008, 140\u2013146"},{"issue":"6","key":"2291_CR14","doi-asserted-by":"crossref","first-page":"172","DOI":"10.1109\/MCOM.2011.5784003","volume":"49","author":"O Sallent","year":"2011","unstructured":"Sallent O, P\u00e9rez-Romero J, S\u00e1nchez-Gonz\u00e1lez J, Agust\u00ed R, D\u00edazguerra MA, Henche D, Paul D. A roadmap from UMTS optimization to LTE self-optimization. IEEE Communications Magazine, 2011, 49(6): 172\u2013182","journal-title":"IEEE Communications Magazine"},{"issue":"2","key":"2291_CR15","doi-asserted-by":"crossref","first-page":"401","DOI":"10.1109\/TMM.2011.2173477","volume":"14","author":"H Bobarshad","year":"2012","unstructured":"Bobarshad H, van der Schaar M, Aghvami A H, Dilmaghani R S, Shikh-Bahaei M R. Analytical modeling for delay-sensitive video over WLAN. IEEE Transactions on Multimedia, 2012, 14(2): 401\u2013414","journal-title":"IEEE Transactions on Multimedia"},{"key":"2291_CR16","first-page":"768","volume-title":"Proceedings of the 2006 Conference on Networking, Sensing and Control","author":"Z Liu","year":"2006","unstructured":"Liu Z, Elhanany I. RL-MAC: a QoS-aware reinforcement learning based MAC protocol for wireless sensor networks. In: Proceedings of the 2006 Conference on Networking, Sensing and Control. 2006, 768\u2013773"},{"key":"2291_CR17","first-page":"2276","volume-title":"Proceedings of the 65th IEEE Vehicular Technology Conference","author":"R Yu","year":"2007","unstructured":"Yu R, Sun Z, Mei S. Packet scheduling in broadband wireless networks using neuro-dynamic programming. In: Proceedings of the 65th IEEE Vehicular Technology Conference. 2007, 2276\u20132780"},{"key":"2291_CR18","first-page":"895","volume-title":"Proceedings of the 2012 IEEE International Conference on Pervasive Computing and Communications","author":"M I Khan","year":"2012","unstructured":"Khan M I, Rinner B. Resource coordination in wireless sensor net works by cooperative reinforcement learning. In: Proceedings of the 2012 IEEE International Conference on Pervasive Computing and Communications. 2012, 895\u2013900"},{"key":"2291_CR19","first-page":"1789","volume":"7","author":"J R Kok","year":"2006","unstructured":"Kok J R, Vlassis N. Collaborative multiagent reinforcement learning by payoff propagation. Journal of Machine Learning Research, 2006, 7: 1789\u20131828","journal-title":"Journal of Machine Learning Research"},{"key":"2291_CR20","first-page":"371","volume-title":"Proceedings of the 16th Conference on Machine Learning","author":"J Schneider","year":"1999","unstructured":"Schneider J, Wong W-K, Moore A, Riedmiller M, Distributed value functions. In: Proceedings of the 16th Conference on Machine Learning. 1999, 371\u2013378"},{"issue":"4","key":"2291_CR21","doi-asserted-by":"crossref","first-page":"366","DOI":"10.1109\/LCOM.2007.348303","volume":"11","author":"A Sahoo","year":"2007","unstructured":"Sahoo A, Manjunath D. Revisiting WFQ: minimum packet lengths tighten delay and fairness bounds. IEEE Communications Letters, 2007, 11(4): 366\u2013368","journal-title":"IEEE Communications Letters"},{"issue":"8","key":"2291_CR22","doi-asserted-by":"crossref","first-page":"1163","DOI":"10.1049\/iet-com.2010.0378","volume":"5","author":"H Yu","year":"2011","unstructured":"Yu H, Ding L, Liu N, Pan Z, Wu P, You X. Enhanced first-in-first-outbased round-robin multicast scheduling algorithm for input-queued switches. IET Communications, 2011, 5(8): 1163\u20131171","journal-title":"IET Communications"},{"key":"2291_CR23","first-page":"152","volume-title":"Proceedings of the 2010 Conference on Local Computer Networks","author":"K L A Yau","year":"2010","unstructured":"Yau K L A, Komisarczuk P, Teal P D. Enhancing network performance in distributed cognitive radio networks using single-agent and multi-agent reinforcement learning. In: Proceedings of the 2010 Conference on Local Computer Networks. 2010, 152\u2013159"},{"key":"2291_CR24","volume-title":"Proceedings of Massachusetts Institute of Technology ESD Internal Symposium","author":"Engineering Systems Division ESD.","year":"2002","unstructured":"Engineering Systems Division (ESD). ESD Symposium Committee Overview. In: Proceedings of Massachusetts Institute of Technology ESD Internal Symposium. 2002. http:\/\/esd.mit.edu\/WPS"},{"key":"2291_CR25","first-page":"479","volume-title":"Proceedings of the 33rd International Conference on Information and Communication Technology. Electronics and Microelectronics","author":"D Ouzecki","year":"2010","unstructured":"Ouzecki D, Jevtic D. Reinforcement learning as adaptive network routing of mobile agents. In: Proceedings of the 33rd International Conference on Information and Communication Technology. Electronics and Microelectronics. 2010, 479\u2013484"},{"issue":"1","key":"2291_CR26","doi-asserted-by":"crossref","first-page":"243","DOI":"10.1109\/TNET.2011.2159844","volume":"20","author":"A A Bhorkar","year":"2012","unstructured":"Bhorkar A A, Naghshvar M, Javidi T, Rao B D. Adaptive opportunistic routing for wireless ad hoc networks. IEEE\/ACM Transactions on Network, 2012, 20(1): 243\u2013256","journal-title":"IEEE\/ACM Transactions on Network"},{"issue":"1","key":"2291_CR27","doi-asserted-by":"crossref","first-page":"102","DOI":"10.1109\/TWC.2010.111910.091238","volume":"10","author":"Z Lin","year":"2011","unstructured":"Lin Z, Schaar M V D. Autonomic and distributed joint routing and power control for delay-sensitive applications in multi-hop wireless networks. IEEE Transactions on Wireless Communications, 2011, 10(1): 102\u2013113","journal-title":"IEEE Transactions on Wireless Communications"},{"key":"2291_CR28","doi-asserted-by":"crossref","first-page":"1233","DOI":"10.1109\/ICRTIT.2011.5972411","volume-title":"Proceedings of the 2011 International Conference on Recent Trends in Information Technology","author":"G Santhi","year":"2011","unstructured":"Santhi G, Nachiappan A, Ibrahime M Z, Raghunadhane R, Favas M K. Q-learning based adaptive QoS routing protocol for MANETs. In: Proceedings of the 2011 International Conference on Recent Trends in Information Technology. 2011, 1233\u20131238"}],"container-title":["Frontiers of Computer Science"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11704-013-2291-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11704-013-2291-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11704-013-2291-3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,7,20]],"date-time":"2019-07-20T15:31:11Z","timestamp":1563636671000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11704-013-2291-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,8,10]]},"references-count":28,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2013,10]]}},"alternative-id":["2291"],"URL":"https:\/\/doi.org\/10.1007\/s11704-013-2291-3","relation":{},"ISSN":["2095-2228","2095-2236"],"issn-type":[{"value":"2095-2228","type":"print"},{"value":"2095-2236","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,8,10]]}}}