{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T11:15:39Z","timestamp":1743160539553,"version":"3.37.3"},"publisher-location":"Cham","reference-count":26,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319736020"},{"type":"electronic","value":"9783319736037"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-73603-7_23","type":"book-chapter","created":{"date-parts":[[2018,1,12]],"date-time":"2018-01-12T04:13:02Z","timestamp":1515730382000},"page":"279-290","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Improving the Quality of Video-to-Language Models by Optimizing Annotation of the Training Material"],"prefix":"10.1007","author":[{"given":"Laura","family":"P\u00e9rez-Mayos","sequence":"first","affiliation":[]},{"given":"Federico M.","family":"Sukno","sequence":"additional","affiliation":[]},{"given":"Leo","family":"Wanner","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,1,13]]},"reference":[{"key":"23_CR1","unstructured":"Awad, G., et al.: Trecvid 2016: evaluating video search, video event detection, localization, and hyperlinking. In: Proceedings of TRECVID, vol. 2016 (2016)"},{"key":"23_CR2","doi-asserted-by":"crossref","unstructured":"Baroni, M., Dinu, G., Kruszewski, G.: Don\u2019t count, predict! a systematic comparison of context-counting vs. context-predicting semantic vectors. In: ACL, vol. 1, pp. 238\u2013247 (2014)","DOI":"10.3115\/v1\/P14-1023"},{"issue":"3","key":"23_CR3","first-page":"297","volume":"31","author":"R Barzilay","year":"2005","unstructured":"Barzilay, R., McKeown, K.R.: Sentence fusion for multi-document news summarization. CL 31(3), 297\u2013328 (2005)","journal-title":"CL"},{"key":"23_CR4","first-page":"1137","volume":"3","author":"Y Bengio","year":"2003","unstructured":"Bengio, Y., et al.: A neural probabilistic language model. JMLR 3, 1137\u20131155 (2003)","journal-title":"JMLR"},{"key":"23_CR5","doi-asserted-by":"crossref","unstructured":"Bing, L., et al.: Abstractive multi-document summarization via phrase selection and merging. arXiv preprint arXiv:1506.01597 (2015)","DOI":"10.3115\/v1\/P15-1153"},{"key":"23_CR6","unstructured":"Boudin, F., Morin, E.: Keyphrase extraction for n-best reranking in multi-sentence compression. In: NAACL (2013)"},{"key":"23_CR7","doi-asserted-by":"crossref","unstructured":"Cheung, J.C.K., Penn, G.: Unsupervised sentence enhancement for automatic summarization. In: EMNLP, pp. 775\u2013786 (2014)","DOI":"10.3115\/v1\/D14-1085"},{"key":"23_CR8","doi-asserted-by":"crossref","unstructured":"Collobert, R., Weston, J.: A unified architecture for natural language processing: deep neural networks with multitask learning. In: Proceedings of the 25th ICML, pp. 160\u2013167. ACM (2008)","DOI":"10.1145\/1390156.1390177"},{"key":"23_CR9","unstructured":"Elsner, M., Santhanam, D.: Learning to fuse disparate sentences. In: Proceedings of the Workshop on Monolingual Text-To-Text Generation, pp. 54\u201363. ACL (2011)"},{"key":"23_CR10","unstructured":"Filippova, K.: Multi-sentence compression: finding shortest paths in word graphs. In: Proceedings of the 23rd ICCL, pp. 322\u2013330. ACL (2010)"},{"key":"23_CR11","doi-asserted-by":"crossref","unstructured":"Filippova, K., Strube, M.: Sentence fusion via dependency graph compression. In: Proceedings of the CEMNLP, pp. 177\u2013185. ACL (2008)","DOI":"10.3115\/1613715.1613741"},{"key":"23_CR12","unstructured":"Han, L., et al.: UMBC_EBIQUITY-CORE: semantic textual similarity systems. In: * SEM@ NAACL-HLT, pp. 44\u201352 (2013)"},{"key":"23_CR13","doi-asserted-by":"crossref","unstructured":"Iacobacci, I., Pilehvar, M.T., Navigli, R.: SensEmbed: learning sense embeddings for word and relational similarity. In: ACL, vol. 1, pp. 95\u2013105 (2015)","DOI":"10.3115\/v1\/P15-1010"},{"key":"23_CR14","unstructured":"Mikolov, T., et al.: Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781 (2013)"},{"issue":"11","key":"23_CR15","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1145\/219717.219748","volume":"38","author":"GA Miller","year":"1995","unstructured":"Miller, G.A.: WordNet: a lexical database for English. Commun. ACM 38(11), 39\u201341 (1995)","journal-title":"Commun. ACM"},{"key":"23_CR16","doi-asserted-by":"crossref","unstructured":"Mnih, A., Hinton, G.: Three new graphical models for statistical language modelling. In: Proceedings of the 24th ICML, pp. 641\u2013648. ACM (2007)","DOI":"10.1145\/1273496.1273577"},{"key":"23_CR17","unstructured":"Navigli, R., Ponzetto, S.P.: BabelNet: building a very large multilingual semantic network. In: Proceedings of the 48th Annual Meeting of the ACL, pp. 216\u2013225. ACL (2010)"},{"key":"23_CR18","doi-asserted-by":"crossref","unstructured":"Ramanishka, V., et al.: Multimodal video description. In: Proceedings of the 2016 ACM on Multimedia Conference, pp. 1092\u20131096. ACM (2016)","DOI":"10.1145\/2964284.2984066"},{"key":"23_CR19","doi-asserted-by":"crossref","unstructured":"Ramanishka, V., et al.: Top-down visual saliency guided by captions. In: arXiv preprint arXiv:1612.07360 (2016)","DOI":"10.1109\/CVPR.2017.334"},{"key":"23_CR20","unstructured":"Thadani, K., McKeown, K.: Supervised sentence fusion with single-stage inference. In: IJCNLP, pp. 1410\u20131418 (2013)"},{"key":"23_CR21","unstructured":"Turian, J., Ratinov, L., Bengio, Y.: Word representations: a simple and general method for semi-supervised learning. In: Proceedings of the 48th Annual Meeting of the ACL, pp. 384\u2013394. ACL (2010)"},{"key":"23_CR22","unstructured":"Tzouridis, E., Nasir, J.A., Brefeld, U.: Learning to summarise related sentences. In: COLING, pp. 1636\u20131647 (2014)"},{"key":"23_CR23","unstructured":"Vadapalli, R. et al.: SSAS: semantic similarity for abstractive summarization. In: Proceedings of the IJCNLP (2017)"},{"key":"23_CR24","doi-asserted-by":"crossref","unstructured":"Xu, J., et al.: MSR-VTT: A large video description dataset for bridging video and language. In: Proceedings of the IEEE Conference on CVPR, pp. 5288\u20135296 (2016)","DOI":"10.1109\/CVPR.2016.571"},{"key":"23_CR25","doi-asserted-by":"crossref","unstructured":"Yu, M., Dredze, M.: Improving lexical embeddings with semantic knowledge. In: ACL, vol. 2, pp. 545\u2013550 (2014)","DOI":"10.3115\/v1\/P14-2089"},{"key":"23_CR26","unstructured":"Zou, W.Y., et al.: Bilingual word embeddings for phrase-based machine translation. In: EMNLP, pp. 1393\u20131398 (2013)"}],"container-title":["Lecture Notes in Computer Science","MultiMedia Modeling"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-73603-7_23","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,9]],"date-time":"2019-10-09T04:55:56Z","timestamp":1570596956000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-73603-7_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319736020","9783319736037"],"references-count":26,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-73603-7_23","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2018]]}}}