{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T06:27:32Z","timestamp":1725863252290},"publisher-location":"Cham","reference-count":24,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319439815"},{"type":"electronic","value":"9783319439822"}],"license":[{"start":{"date-parts":[[2016,8,17]],"date-time":"2016-08-17T00:00:00Z","timestamp":1471392000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-43982-2_27","type":"book-chapter","created":{"date-parts":[[2016,8,16]],"date-time":"2016-08-16T10:26:45Z","timestamp":1471343205000},"page":"307-320","source":"Crossref","is-referenced-by-count":0,"title":["Unsupervised Construction of Quasi-comparable Corpora and Probing for Parallel Textual Data"],"prefix":"10.1007","author":[{"given":"Krzysztof","family":"Wo\u0142k","sequence":"first","affiliation":[]},{"given":"Krzysztof","family":"Marasek","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,8,17]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Wo\u0142k, K., Marasek, K.: Real-time statistical speech translation.\u00a0New Perspectives in Information Systems and Technologies, vol. 1, pp. 107\u2013113. Springer International Publishing (2014)","key":"27_CR1","DOI":"10.1007\/978-3-319-05951-8_11"},{"unstructured":"Wo\u0142k,\u00a0K., Marasek, K.: Polish\u2013English speech statistical machine translation systems for the IWSLT 2013. In: Proceedings of the 10th International Workshop on Spoken Language Translation, Heidelberg, Germany, pp. 113\u2013119 (2013)","key":"27_CR2"},{"doi-asserted-by":"crossref","unstructured":"Koehn, P.: Statistical Machine Translation. Cambridge University Press (2009)","key":"27_CR3","DOI":"10.1017\/CBO9780511815829"},{"unstructured":"Berrotar\u00e1n, G., Carrascosa, R., Vine, A.: Yalign documentation. Accessed 01 2015","key":"27_CR4"},{"key":"27_CR5","first-page":"34","volume":"2013","author":"C Chu","year":"2013","unstructured":"Chu, C., Nakazawa, T., Kurohashi, S.: Chinese-Japanese parallel sentence extraction from quasi\u2013comparable corpora. ACL 2013, 34 (2013)","journal-title":"ACL"},{"doi-asserted-by":"crossref","unstructured":"Wu, D., Fung, P.: Inversion transduction grammar constraints for mining parallel sentences from quasi-comparable corpora. Natural Language Processing\u2014IJCNLP 2005. Lecture Notes in Computer Science, vol. 3651, pp. 257\u2013268 (2005)","key":"27_CR6","DOI":"10.1007\/11562214_23"},{"unstructured":"Adafree, S.F., deRijke, M.: Finding similar sentences across multiple languages in Wikipedia (2006)","key":"27_CR7"},{"doi-asserted-by":"crossref","unstructured":"Mohammadi, M., and Aghaee, N.Q.: Building bilingual parallel corpora based on Wikipedia (2010)","key":"27_CR8","DOI":"10.1109\/ICCEA.2010.203"},{"unstructured":"Chu, C., Nakazawa, T., Kurohashi, S.: Accurate parallel fragment extraction from quasi\u2013comparable corpora using alignment model and translation lexicon. In: Proceedings of the Sixth International Joint Conference on Natural Language Processing, pp. 1144\u20131150 (2013)","key":"27_CR9"},{"unstructured":"Yasuda, K., Sumita, E.: Method for building sentence-aligned corpus from Wikipedia (2008)","key":"27_CR10"},{"unstructured":"Plamada, M., Volk, M.: Mining for domain-specific parallel texts from the Wikipedia (2013)","key":"27_CR11"},{"unstructured":"Aker, A., Kanoulas, E., Gaizauskas, R.J., A light way to collect comparable corpora from the Web. LREC (2012)","key":"27_CR12"},{"doi-asserted-by":"crossref","unstructured":"Str\u00f6tgen, J., Gertz, M., Junghans, C.: An event-centric model for multilingual document similarity. In: SIGIR\u201911: Proceedings of the 34th International ACM SIGIR Conference on Research and Development in Information Retrieval, Beijing, China, pp. 953\u2013962 (2011)","key":"27_CR13","DOI":"10.1145\/2009916.2010043"},{"issue":"3","key":"27_CR14","first-page":"377","volume":"23","author":"D Wu","year":"1997","unstructured":"Wu, D.: Stochastic inversion transduction grammars and bilingual parsing of parallel corpora. Comput. Linguist. 23(3), 377\u2013403 (1997)","journal-title":"Comput. Linguist."},{"doi-asserted-by":"crossref","unstructured":"Sarikaya, R., Maskey, S., Zhang, R., Jan, E. E., Wang, D., Ramabhadran, B., Roukos, S.: Iterative sentence-pair extraction from quasi-parallel corpora for machine translation. In:\u00a0INTERSPEECH, pp. 432\u2013435 (2009)","key":"27_CR15","DOI":"10.21437\/Interspeech.2009-156"},{"doi-asserted-by":"crossref","unstructured":"Wu, D., Fung, P.: Inversion transduction grammar constraints for mining parallel sentences from quasi-comparable corpora. In:\u00a0Natural Language Processing\u2013IJCNLP 2005, pp. 257\u2013268 (2005)","key":"27_CR16","DOI":"10.1007\/11562214_23"},{"unstructured":"Cettolo, M., Girardi, C., Federico, M.: WIT3: Web inventory of transcribed and translated talks. In: Proceedings of EAMT, Trento, Italy, pp. 261\u2013268 (2012)","key":"27_CR17"},{"unstructured":"Bojar, O., Rosa, R., Tamchyna, A.: Chimera\u2013three heads for English-to-Czech translation. In: Proceedings of the Eighth Workshop on Statistical Machine Translation. Association for Computational Linguistics Sofia, Bulgaria, pp. 90\u201396 (2013)","key":"27_CR18"},{"unstructured":"Musso, G.: Sequence alignment (Needleman-Wunsch, Smith-Waterman). http:\/\/www.cs.utoronto.ca\/~brudno\/bcb410\/lec2notes.pdf","key":"27_CR19"},{"issue":"1998","key":"27_CR20","first-page":"137","volume":"1398","author":"T Joachims","year":"2005","unstructured":"Joachims, T.: Text categorization with support vector machines: learning with many relevant features. Lect. Notes Comput. Sci. 1398(1998), 137\u2013142 (2005)","journal-title":"Lect. Notes Comput. Sci."},{"unstructured":"Wo\u0142k, K., Marasek, K.: A sentence meaning based alignment method for parallel text corpora preparation. Advances in Intelligent Systems and Computing, vol. 275, pp. 107\u2013114. Springer, Madeira Island, Portugal (2014). ISSN 2194-5357. ISBN 978-3-319-05950-1","key":"27_CR21"},{"unstructured":"Roessler R.: A GPU implementation of Needleman-Wunsch. Specifically for use in the Program PyroNoise 2 (2010)","key":"27_CR22"},{"unstructured":"Koehn, P., Haddow, B.: Towards effective use of training data in statistical machine translation. In: WMT\u201912 Proceedings of the Seventh Workshop on Statistical Machine Translation, Stroudsburg, PA, USA, 317\u2013321 (2012)","key":"27_CR23"},{"unstructured":"Clark, J.H., Dyer, C., Lavie, A., Smith, N.A.: Better hypothesis testing for statistical machine translation: controlling for optimizer instability. In: Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies: short papers, vol. 2, pp. 176\u2013181. Association for Computational Linguistics (2011)","key":"27_CR24"}],"container-title":["Advances in Intelligent Systems and Computing","Multimedia and Network Information Systems"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-43982-2_27","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,5]],"date-time":"2022-07-05T22:27:10Z","timestamp":1657060030000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-43982-2_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,8,17]]},"ISBN":["9783319439815","9783319439822"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-43982-2_27","relation":{},"ISSN":["2194-5357","2194-5365"],"issn-type":[{"type":"print","value":"2194-5357"},{"type":"electronic","value":"2194-5365"}],"subject":[],"published":{"date-parts":[[2016,8,17]]}}}