{"id":"https://openalex.org/W2050703362","doi":"https://doi.org/10.1109/scam.2010.19","title":"Language-Independent Clone Detection Applied to Plagiarism Detection","display_name":"Language-Independent Clone Detection Applied to Plagiarism Detection","publication_year":2010,"publication_date":"2010-09-01","ids":{"openalex":"https://openalex.org/W2050703362","doi":"https://doi.org/10.1109/scam.2010.19","mag":"2050703362"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/scam.2010.19","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022820267","display_name":"Romain Brixtel","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I98702875","display_name":"Universit\u00e9 de Caen Normandie","ror":"https://ror.org/051kpcy16","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918","https://openalex.org/I98702875"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Romain Brixtel","raw_affiliation_strings":["GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France"],"affiliations":[{"raw_affiliation_string":"GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I98702875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082784886","display_name":"Mathieu Fontaine","orcid":"https://orcid.org/0000-0002-7657-6271"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I98702875","display_name":"Universit\u00e9 de Caen Normandie","ror":"https://ror.org/051kpcy16","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918","https://openalex.org/I98702875"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Mathieu Fontaine","raw_affiliation_strings":["GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France"],"affiliations":[{"raw_affiliation_string":"GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I98702875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088549422","display_name":"Boris Lesner","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I98702875","display_name":"Universit\u00e9 de Caen Normandie","ror":"https://ror.org/051kpcy16","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918","https://openalex.org/I98702875"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Boris Lesner","raw_affiliation_strings":["GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France"],"affiliations":[{"raw_affiliation_string":"GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I98702875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024898630","display_name":"Cyril Bazin","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I98702875","display_name":"Universit\u00e9 de Caen Normandie","ror":"https://ror.org/051kpcy16","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918","https://openalex.org/I98702875"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Cyril Bazin","raw_affiliation_strings":["GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France"],"affiliations":[{"raw_affiliation_string":"GREYC-CNRS, Univ. of Caen Basse-Normandie, Caen, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I98702875"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031712876","display_name":"Romain Robbes","orcid":"https://orcid.org/0000-0003-4569-6868"},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"Romain Robbes","raw_affiliation_strings":["DCC University of Chile, Santiago, Chile"],"affiliations":[{"raw_affiliation_string":"DCC University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":52,"citation_normalized_percentile":{"value":0.991604,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"77","last_page":"86"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.9861,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/plagiarism-detection","display_name":"Plagiarism detection","score":0.6779275},{"id":"https://openalex.org/keywords/python","display_name":"Python","score":0.53934526},{"id":"https://openalex.org/keywords/haskell","display_name":"Haskell","score":0.4774109},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness","score":0.43519065},{"id":"https://openalex.org/keywords/clone","display_name":"clone (Java method)","score":0.41516396}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.85618925},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.7416369},{"id":"https://openalex.org/C2780907237","wikidata":"https://www.wikidata.org/wiki/Q2986238","display_name":"Plagiarism detection","level":2,"score":0.6779275},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.6288346},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.60873646},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.53934526},{"id":"https://openalex.org/C2780624054","wikidata":"https://www.wikidata.org/wiki/Q34010","display_name":"Haskell","level":3,"score":0.4774109},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.43519065},{"id":"https://openalex.org/C81089528","wikidata":"https://www.wikidata.org/wiki/Q5134986","display_name":"clone (Java method)","level":3,"score":0.41516396},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.38809133},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3155444},{"id":"https://openalex.org/C42383842","wikidata":"https://www.wikidata.org/wiki/Q193076","display_name":"Functional programming","level":2,"score":0.21474302},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/scam.2010.19","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://hal.archives-ouvertes.fr/hal-01067165","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://hal.science/hal-01067165","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, justice, and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.59}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":23,"referenced_works":["https://openalex.org/W1583371541","https://openalex.org/W1647671624","https://openalex.org/W1971075060","https://openalex.org/W1980482639","https://openalex.org/W2073265902","https://openalex.org/W2074529754","https://openalex.org/W2096491586","https://openalex.org/W2106487114","https://openalex.org/W2107464569","https://openalex.org/W2109943392","https://openalex.org/W2111295912","https://openalex.org/W2119538795","https://openalex.org/W2121412398","https://openalex.org/W2128859735","https://openalex.org/W2128888088","https://openalex.org/W2138756793","https://openalex.org/W2146659255","https://openalex.org/W2157532207","https://openalex.org/W2169470206","https://openalex.org/W2172244770","https://openalex.org/W2221569141","https://openalex.org/W2222512263","https://openalex.org/W3003280364"],"related_works":["https://openalex.org/W4287331153","https://openalex.org/W4224015079","https://openalex.org/W3173165160","https://openalex.org/W3127649977","https://openalex.org/W3127553152","https://openalex.org/W3002459461","https://openalex.org/W2914826750","https://openalex.org/W2155491649","https://openalex.org/W2100097978","https://openalex.org/W1985086575"],"abstract_inverted_index":{"Clone":[0],"detection":[1,30,34,48,59],"is":[2,130,143],"usually":[3],"applied":[4,31],"in":[5,17,35,70,100,107],"the":[6,26,36,63,66,75,115,122,126,137,150],"context":[7,37],"of":[8,14,28,38,54,65,110,169,177],"detecting":[9],"small-to":[10],"medium":[11],"scale":[12],"fragments":[13],"duplicated":[15],"code":[16,40,77],"large":[18],"software":[19],"systems.":[20],"In":[21],"this":[22,71],"paper,":[23],"we":[24,68,112,128],"address":[25],"problem":[27],"clone":[29,58],"to":[32,56,89,158,190,196],"plagiarism":[33],"source":[39,76,171],"assignments":[41,98],"done":[42],"by":[43,101],"computer":[44,102],"science":[45,103],"students.":[46],"Plagiarism":[47],"comes":[49],"with":[50],"a":[51,83,108,174],"distinct":[52],"set":[53],"constraints":[55],"usual":[57],"approaches,":[60],"which":[61],"influenced":[62],"design":[64],"approach":[67,127,187],"present":[69],"paper.":[72],"For":[73],"instance,":[74],"can":[78,105],"be":[79,93,106],"heavily":[80],"changed":[81],"at":[82,114,153],"superficial":[84],"level":[85,117],"(in":[86],"an":[87,146],"attempt":[88],"look":[90],"genuine),":[91],"yet":[92],"functionally":[94],"very":[95],"similar.":[96],"Since":[97],"turned":[99],"students":[104],"variety":[109],"languages,":[111],"work":[113],"syntactic":[116],"and":[118,132,195,201],"do":[119],"not":[120],"consider":[121],"source-code":[123],"semantics.":[124],"Consequently,":[125],"propose":[129],"endogenous":[131],"makes":[133],"no":[134],"assumption":[135],"about":[136],"programming":[138,178],"language":[139],"being":[140],"analysed.":[141],"It":[142],"based":[144],"on":[145,167],"alignment":[147],"method":[148],"using":[149],"parallel":[151],"principle":[152],"local":[154],"resolution":[155],"(character":[156],"level)":[157],"compute":[159],"similarities":[160],"between":[161],"documents.":[162],"We":[163],"tested":[164],"our":[165],"framework":[166],"hundreds":[168],"real":[170],"files,":[172],"involving":[173],"wide":[175],"array":[176],"languages":[179],"(Java,":[180],"C,":[181],"Python,":[182],"PHP,":[183],"Haskell,":[184],"bash).":[185],"Our":[186],"allowed":[188],"us":[189],"discover":[191],"previously":[192],"undetected":[193],"frauds,":[194],"empirically":[197],"evaluate":[198],"its":[199],"accuracy":[200],"robustness.":[202]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2050703362","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":4}],"updated_date":"2024-12-14T15:23:08.318802","created_date":"2016-06-24"}