{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T23:34:52Z","timestamp":1743118492178,"version":"3.40.3"},"publisher-location":"Cham","reference-count":40,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319420912"},{"type":"electronic","value":"9783319420929"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-42092-9_42","type":"book-chapter","created":{"date-parts":[[2016,6,30]],"date-time":"2016-06-30T10:02:55Z","timestamp":1467280975000},"page":"552-566","source":"Crossref","is-referenced-by-count":1,"title":["An Innovative Similarity Measure for Sentence Plagiarism Detection"],"prefix":"10.1007","author":[{"given":"Agnese","family":"Augello","sequence":"first","affiliation":[]},{"given":"Alfredo","family":"Cuzzocrea","sequence":"additional","affiliation":[]},{"given":"Giovanni","family":"Pilato","sequence":"additional","affiliation":[]},{"given":"Carmelo","family":"Spiccia","sequence":"additional","affiliation":[]},{"given":"Giorgio","family":"Vassallo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,7,1]]},"reference":[{"key":"42_CR1","doi-asserted-by":"crossref","unstructured":"Dolan, B., Quirk, C., Brockett, C.: Unsupervised construction of large paraphrase corpora: exploiting massively parallel news sources, In: Proceedings of the 20th International Conference on Computational Linguistics (COLING), Geneva, Switzerland, pp. 350\u2013356 (2004)","DOI":"10.3115\/1220355.1220406"},{"key":"42_CR2","doi-asserted-by":"crossref","unstructured":"Hassan, S.: Measuring semantic relatedness using salient encyclopedic concepts. Ph.D. thesis, University of Texas (2011)","DOI":"10.1609\/aaai.v25i1.7971"},{"key":"42_CR3","unstructured":"Ji, Y., Eisenstein, J.: Discriminative improvements to distributional sentence similarity. In: Proceedings of Empirical Methods in Natural Language Processing (EMNLP), Seattle, Washington, USA, pp. 891\u2013896 (2013)"},{"issue":"8","key":"42_CR4","first-page":"707","volume":"10","author":"VI Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions, and reversals. Sov. Phys. Dokl. 10(8), 707\u2013710 (1966)","journal-title":"Sov. Phys. Dokl."},{"key":"42_CR5","doi-asserted-by":"crossref","unstructured":"Morris, A.C., Maier, V., Green, P.: From WER and RIL to MER and WIL: improved evaluation measures for connected speech recognition. In: INTERSPEECH (2004)","DOI":"10.21437\/Interspeech.2004-668"},{"issue":"2","key":"42_CR6","first-page":"57","volume":"18","author":"RD Burke","year":"1997","unstructured":"Burke, R.D., Hammond, K.J., Kulyukin, V., Lytinen, S.L., Tomuro, N., Schoenberg, S.: Question answering from frequently asked question files: experiences with the FAQ finder system. AI Mag. 18(2), 57\u201366 (1997)","journal-title":"AI Mag."},{"issue":"4","key":"42_CR7","doi-asserted-by":"crossref","first-page":"7764","DOI":"10.1016\/j.eswa.2008.11.022","volume":"36","author":"RM Aliguliyev","year":"2009","unstructured":"Aliguliyev, R.M.: A new sentence similarity measure and sentence based extractive technique for automatic text summarization. Expert Syst. Appl. 36(4), 7764\u20137772 (2009)","journal-title":"Expert Syst. Appl."},{"key":"42_CR8","doi-asserted-by":"crossref","first-page":"457","DOI":"10.1613\/jair.1523","volume":"22","author":"G Erkan","year":"2004","unstructured":"Erkan, G., Radev, D.R.: LexRank: graph-based lexical centrality as salience in text summarization. J. Artif. Intell. Res. 22, 457\u2013479 (2004)","journal-title":"J. Artif. Intell. Res."},{"key":"42_CR9","unstructured":"Liu, D., Gildea, D.: Syntactic features for evaluation of machine translation. In: Proceedings of the ACL Workshop on Intrinsic and Extrinsic Evaluation Measures for Machine Translation and\/or Summarization, pp. 25\u201332 (2005)"},{"key":"42_CR10","unstructured":"Madnani, N., Tetreault, J., Chodorow, M.: Re-examining machine transla-tion metrics for paraphrase identification. In: Proceedings of the 2012 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (NAACL HLT 2012), pp. 182-190. Association for Computa-tional Linguistics (2012)"},{"key":"42_CR11","unstructured":"Niwattanakul, S., Singthongchai, J., Naenudorn, E., Wanapu, S.: Using of Jaccard coefficient for keywords similarity. In: Proceedings of the International MultiConference of Engineers and Computer Scientists (IMECS), vol. 1, pp. 380\u2013384 (2013)"},{"key":"42_CR12","doi-asserted-by":"crossref","unstructured":"Papineni, K., Roukos, S., Ward, T., Zhu, W.J.: BLEU: a method for automatic evaluation of machine translation. In: Proceedings of the 40th Annual Meeting on Association for Computational Linguistics (ACL), pp. 311\u2013318. Association for Computational Linguistics (2002)","DOI":"10.3115\/1073083.1073135"},{"key":"42_CR13","doi-asserted-by":"crossref","unstructured":"Doddington, G.: Automatic evaluation of machine translation quality using n-gram co-occurrence statistics. In: Proceedings of the Second International Conference on Human Language Technology Research (HLT), pp. 138\u2013145 (2002)","DOI":"10.3115\/1289189.1289273"},{"key":"42_CR14","unstructured":"Snover, M., Dorr, B., Schwartz, R., Micciulla, L., Makhoul, J.: A study of translation edit rate with targeted human annotation. In: Proceedings of the Seventh Conference of the Association for Machine Translation in the Americas (AMTA), pp. 223\u2013231 (2006)"},{"key":"42_CR15","unstructured":"Snover, M., Madnani, N., Dorr, B., Schwartz, R.: TERp system description. In: Proceedings of Metrics MATR Workshop at the Eighth Conference of the Association for Machine Translation in the Americas (AMTA), vol. 555 (2008)"},{"issue":"3","key":"42_CR16","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","volume":"14","author":"MF Porter","year":"1980","unstructured":"Porter, M.F.: An algorithm for suffix stripping. Program 14(3), 130\u2013137 (1980)","journal-title":"Program"},{"issue":"2\u20133","key":"42_CR17","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1007\/s10590-009-9059-4","volume":"23","author":"A Lavie","year":"2009","unstructured":"Lavie, A., Denkowski, M.J.: The METEOR metric for automatic evaluation of machine translation. Mach. Transl. 23(2\u20133), 105\u2013115 (2009)","journal-title":"Mach. Transl."},{"key":"42_CR18","doi-asserted-by":"crossref","unstructured":"Allan, J., Wade, C., Bolivar, A.: Retrieval and novelty detection at the sentence level. In: Proceedings of the 26th Annual International ACM SIGIR Conference on Research and Development in Informaion Retrieval (SIGIR 2003), pp. 314\u2013321 (2003)","DOI":"10.1145\/860435.860493"},{"key":"42_CR19","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1002\/asi.10170","volume":"54","author":"TC Hoad","year":"2003","unstructured":"Hoad, T.C., Zobel, J.: Methods for identifying versioned and plagiarised documents. J. Am. Soc. Inform. Sci. Technol. 54, 203\u2013215 (2003)","journal-title":"J. Am. Soc. Inform. Sci. Technol."},{"key":"42_CR20","doi-asserted-by":"crossref","unstructured":"Metzler, D., Bernstein, Y., Croft, W.B., Moffat, A., Zobel, J.: Similarity measures for tracking information flow. In: Proceedings of the 14th ACM International Conference on Information And Knowledge Management (CIKM), pp. 517\u2013524 (2005)","DOI":"10.1145\/1099554.1099695"},{"key":"42_CR21","doi-asserted-by":"crossref","unstructured":"Barzilay, R., Lee, L.: Learning to paraphrase: an unsupervised approach using multiple-sequence alignment. In: Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics on Human Language Technology (NAACL), vol. 1, pp. 16\u201323 (2003)","DOI":"10.3115\/1073445.1073448"},{"key":"42_CR22","unstructured":"Dolan, W.B., Brockett, C.: Automatically constructing a corpus of sentential paraphrases. In: Proceedings of the Third International Workshop on Paraphrasing (IWP) (2005)"},{"issue":"8","key":"42_CR23","doi-asserted-by":"crossref","first-page":"1138","DOI":"10.1109\/TKDE.2006.130","volume":"18","author":"Y Li","year":"2006","unstructured":"Li, Y., McLean, D., Bandar, Z.A., O\u2019Shea, J.D., Crockett, K.: Sentence similarity based on semantic nets and corpus statistics. IEEE Trans. Knowl. Data Eng. 18(8), 1138\u20131150 (2006)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"42_CR24","doi-asserted-by":"crossref","unstructured":"O\u2019Shea, J., Bandar, Z., Crockett, K.: A new benchmark dataset with production methodology for short text semantic similarity algorithms. ACM Trans. Speech Lang. Process. (TSLP) 10(4) (2013). Article no. 19","DOI":"10.1145\/2537046"},{"key":"42_CR25","unstructured":"Agirre, E., Diab, M., Cer, D., Gonzalez-Agirre, A.: Semeval- task 6: A pilot on semantic textual similarity. In: Proceedings of the First Joint Conference on Lexical and Computational Semantics, vol. 1, Proceedings of the Main Conference and the Shared Task. Proceedings of the Sixth International Workshop on Semantic Evaluation, vol. 2, pp. 385\u2013393 (2012)"},{"key":"42_CR26","unstructured":"Agirre, E., Cer, D., Diab, M., Dolan, B.: SemEval-2012 task 6 corpus. University of York (distributor) (2012). https:\/\/www.cs.york.ac.uk\/semeval-2012\/task6\/"},{"key":"42_CR27","unstructured":"Microsoft Research, Microsoft Resarch Video Description Corpus. Microsoft Corporation (2010). http:\/\/research.microsoft.com\/en-us\/downloads\/38cf15fd-b8df-477e-a4e4-a4680caa75af\/"},{"key":"42_CR28","doi-asserted-by":"crossref","unstructured":"Callison-Burch, C.: Workshop on statistical machine translation at ACL 2007 - development data. Johns Hopkins University (2008). http:\/\/www.statmt.org\/wmt08\/shared-evaluation-task.html","DOI":"10.3115\/1626394"},{"key":"42_CR29","unstructured":"Banerjee, S., Pedersen, T.: Extended gloss overlaps as a measure of semantic relatedness. In: Proceedings of the 18th International Joint Conference on Artificial Intelligence (IJCAI), vol. 3, pp. 805\u2013810 (2003)"},{"key":"42_CR30","doi-asserted-by":"crossref","first-page":"181","DOI":"10.1613\/jair.2308","volume":"30","author":"SP Ponzetto","year":"2007","unstructured":"Ponzetto, S.P., Strube, M.: Knowledge derived from wikipedia for computing semantic relatedness. J. Artif. Intell. Res. 30, 181\u2013212 (2007)","journal-title":"J. Artif. Intell. Res."},{"key":"42_CR31","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"85","DOI":"10.1007\/3-540-45452-7_9","volume-title":"Combinatorial Pattern Matching","author":"D Shapira","year":"2002","unstructured":"Shapira, D., Storer, J.A.: Edit distance with move operations. In: Apostolico, A., Takeda, M. (eds.) CPM 2002. LNCS, vol. 2373, pp. 85\u201398. Springer, Heidelberg (2002)"},{"key":"42_CR32","unstructured":"Lee, M.D., Pincombe, B.M., Welsh, M.B.: An empirical evaluation of models of text document similarity. In: Proceedings of the 27th Annual Conference of the Cognitive Science Society, pp. 1254\u20131259 (2005)"},{"issue":"6","key":"42_CR33","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","volume":"41","author":"S Deerwester","year":"1990","unstructured":"Deerwester, S., Dumais, S.T., Furnas, G.W., Landauer, T.K., Harshman, R.: Indexing by latent semantic analysis. J. Am. Soc. Inf. Sci. 41(6), 391\u2013407 (1990)","journal-title":"J. Am. Soc. Inf. Sci."},{"key":"42_CR34","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"837","DOI":"10.1007\/978-3-319-30671-1_76","volume-title":"Advances in Information Retrieval","author":"I Sochenkov","year":"2016","unstructured":"Sochenkov, I., Zubarev, D., Tikhomirov, I., Smirnov, I., Shelmanov, A., Suvorov, R., Osipov, G.: Exactus like: plagiarism detection in scientific texts. In: Ferro, N., et al. (eds.) ECIR 2016. LNCS, vol. 9626, pp. 837\u2013840. Springer, Heidelberg (2016)"},{"key":"42_CR35","doi-asserted-by":"crossref","first-page":"64","DOI":"10.1016\/j.inffus.2015.05.006","volume":"27","author":"JD Vel\u00e1squez","year":"2016","unstructured":"Vel\u00e1squez, J.D., Covacevich, Y., Molina, F., Marrese-Taylor, E., Rodr\u00edguez, C., Bravo-Marquez, F.: DOCODE 3.0 (DOcument COpy DEtector): a system for plagiarism detection by applying an information fusion process from multiple documental data sources. Inf. Fusion 27, 64\u201375 (2016)","journal-title":"Inf. Fusion"},{"key":"42_CR36","doi-asserted-by":"crossref","first-page":"114","DOI":"10.1016\/j.knosys.2015.12.009","volume":"95","author":"D-K Chae","year":"2016","unstructured":"Chae, D.-K., Ha, J., Kim, S.-W., Kang, B., Im, E.G., Park, S.: Credible, resilient, and scalable detection of software plagiarism using authority histograms. Knowl.-Based Syst. 95, 114\u2013124 (2016)","journal-title":"Knowl.-Based Syst."},{"issue":"1","key":"42_CR37","doi-asserted-by":"crossref","first-page":"457","DOI":"10.1007\/s11192-015-1756-6","volume":"106","author":"I Jaric","year":"2016","unstructured":"Jaric, I.: High time for a common plagiarism detection system. Scientometrics 106(1), 457\u2013459 (2016)","journal-title":"Scientometrics"},{"key":"42_CR38","doi-asserted-by":"crossref","unstructured":"Cuzzocrea, A., Sacc\u00e0, D., Ullman, J.D.: Big data: a research agenda. In: Proceedings of the 17th International Database Engineering and Applications Symposium (IDEAS), pp. 198\u2013203 (2013)","DOI":"10.1145\/2513591.2527071"},{"key":"42_CR39","doi-asserted-by":"crossref","unstructured":"Cuzzocrea, A., Bellatreche, L., Song, I.-Y.: Data warehousing, OLAP over big data: current challenges and future research directions. In: Proceedings of the 16th International Workshop on Data Warehousing and OLAP (DOLAP), pp. 67\u201370 (2013)","DOI":"10.1145\/2513190.2517828"},{"key":"42_CR40","doi-asserted-by":"crossref","unstructured":"Cuzzocrea, A.: Analytics over big data: exploring the convergence of data warehousing, OLAP and data-intensive cloud infrastructures.In: Proceedings of the 37th Annual IEEE Computer Software and Applications Conference (COMPSAC), pp. 481\u2013483 (2013)","DOI":"10.1109\/COMPSAC.2013.152"}],"container-title":["Lecture Notes in Computer Science","Computational Science and Its Applications \u2013 ICCSA 2016"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-42092-9_42","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,19]],"date-time":"2023-08-19T02:35:23Z","timestamp":1692412523000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-42092-9_42"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319420912","9783319420929"],"references-count":40,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-42092-9_42","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2016]]}}}