{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,10]],"date-time":"2024-09-10T19:59:02Z","timestamp":1725998342964},"publisher-location":"Cham","reference-count":20,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030033378"},{"type":"electronic","value":"9783030033385"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-030-03338-5_46","type":"book-chapter","created":{"date-parts":[[2018,11,1]],"date-time":"2018-11-01T23:57:42Z","timestamp":1541116662000},"page":"550-559","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Dynamic Delay Based Cyclic Gradient Update Method for Distributed Training"],"prefix":"10.1007","author":[{"given":"Wenhui","family":"Hu","sequence":"first","affiliation":[]},{"given":"Peng","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Qigang","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Zhengdong","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Hui","family":"Xiang","sequence":"additional","affiliation":[]},{"given":"Mei","family":"Li","sequence":"additional","affiliation":[]},{"given":"Zhongchao","family":"Shi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,11,3]]},"reference":[{"key":"46_CR1","unstructured":"Dean, J., Corrado, G., Monga, R., et al.: Large scale distributed deep networks. In: NIPS (2012)"},{"key":"46_CR2","unstructured":"Krizhevsky, A.: One weird trick for parallelizing convolutional neural networks. arXiv:1404.5997 (2014)"},{"key":"46_CR3","doi-asserted-by":"crossref","unstructured":"Li, M., et al.: Scaling distributed machine learning with the parameter server. In: OSDI 2014, pp. 583\u2013598 (2014)","DOI":"10.1145\/2640087.2644155"},{"key":"46_CR4","unstructured":"Zhang, H., et al.: Poseidon: an efficient communication architecture for distributed deep learning on GPU clusters. arXiv:1706.03292 (2017)"},{"key":"46_CR5","unstructured":"Chen, T., et al.: MXNet: a flexible and efficient machine learning library for heterogeneous distributed systems. arXiv:1512.01274 (2015)"},{"key":"46_CR6","unstructured":"Abadi, M., Barham, P., Chen, J.M., et al.: TensorFlow: a system for large-scale machine learning. In: 12th USENIX Symposium on Operating Systems Design and Implementation (OSDI 2016), pp. 265\u2013283 (2016)"},{"key":"46_CR7","unstructured":"Agarwal, A., Duchi, J.C.: Distributed delayed stochastic optimization. In: NIPS 2011, 4247 (2011)"},{"key":"46_CR8","unstructured":"Ho, Q., et al.: More effective distributed ML via a stale synchronous parallel parameter server. In: NIPS 2012, pp. 2141\u20132149 (2012)"},{"key":"46_CR9","doi-asserted-by":"crossref","unstructured":"Chen, X., Eversole, A., Li, G., Yu, D., Seide, F.: Pipelined back-propagation for context-dependent deep neural networks. In: Interspeech 2012 (2012)","DOI":"10.21437\/Interspeech.2012-7"},{"key":"46_CR10","doi-asserted-by":"crossref","unstructured":"Seide, F., Fu, H., Droppo, J., Li, G., Yu, D.: 1-bit stochastic gradient descent and application to data-parallel distributed training of speech DNNs. In: Interspeech 2014 (2014)","DOI":"10.21437\/Interspeech.2014-274"},{"key":"46_CR11","doi-asserted-by":"crossref","unstructured":"Strom, N.: Scalable distributed DNN training using commodity GPU cloud computing. In: Interspeech 2015 (2015)","DOI":"10.21437\/Interspeech.2015-354"},{"key":"46_CR12","unstructured":"Lin, Y., Han, S., Mao, H., Wang, Y., Dally, W.J.: Deep gradient compression: reducing the communication bandwidth for distributed training. In: ICLR 2018 (2018)"},{"issue":"3","key":"46_CR13","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"Olga Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., et al.: ImageNet large scale visual recognition challenge. Int. J. Comput. Vis. 115(3), 211\u2013252 (2015)","journal-title":"International Journal of Computer Vision"},{"key":"46_CR14","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Delving deep into rectifiers: surpassing human-level performance on imagenet classification. In: Proceedings of the 2015 IEEE International Conference on Computer Vision (ICCV), pp. 1026\u20131034 (2015)","DOI":"10.1109\/ICCV.2015.123"},{"key":"46_CR15","doi-asserted-by":"crossref","unstructured":"Bojar, O., Buck, C., Federmann, C., et al.: Findings of the 2015 workshop on statistical machine translation. In: Tenth Workshop on Statistical Machine Translation (2015). http:\/\/www.statmt.org\/wmt15","DOI":"10.18653\/v1\/W15-3001"},{"key":"46_CR16","unstructured":"Vinyals, O., Kaiser, L., Koo, T., et al.: Grammar as a foreign language. In: NIPS 2015, pp. 2773\u20132781 (2015)"},{"key":"46_CR17","doi-asserted-by":"crossref","unstructured":"Li, M., Andersen, D.G., Smola, A.J., Yu, K.: Communication efficient distributed machine learning with the parameter server. In: NIPS 2014, pp. 19\u201327 (2014)","DOI":"10.1145\/2640087.2644155"},{"issue":"1","key":"46_CR18","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1016\/S0893-6080(98)00116-6","volume":"12","author":"N Qian","year":"1999","unstructured":"Qian, N.: On the momentum term in gradient descent learning algorithms. Neural Netw. 12(1), 145\u2013151 (1999)","journal-title":"Neural Netw."},{"issue":"2","key":"46_CR19","first-page":"372","volume":"27","author":"Y Nesterov","year":"1983","unstructured":"Nesterov, Y.: A method of solving a convex programming problem with convergence rate $$\\cal{O} \\left(1 \/ k^{2} \\right)$$. Soviet Math. Doklady 27(2), 372\u2013376 (1983)","journal-title":"Soviet Math. Doklady"},{"key":"46_CR20","unstructured":"Goyal, P., Doll\u00e1r, P., Girshick, R., et al.: Accurate, large minibatch SGD: training ImageNet in 1 hour. arXiv:1706.02677 (2017)"}],"container-title":["Lecture Notes in Computer Science","Pattern Recognition and Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-03338-5_46","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,2]],"date-time":"2023-11-02T00:24:59Z","timestamp":1698884699000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-03338-5_46"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783030033378","9783030033385"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-03338-5_46","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"3 November 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"PRCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Chinese Conference on Pattern Recognition and Computer Vision (PRCV)","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Guangzhou","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 November 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 November 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"1","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ccprcv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/prcv.qyhw.net.cn\/?lang=en&meeting_id=255","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}