{"id":"https://openalex.org/W2589055133","doi":"https://doi.org/10.1145/3011141.3011160","title":"Maximal frequent sequence mining for finding software clones","display_name":"Maximal frequent sequence mining for finding software clones","publication_year":2016,"publication_date":"2016-11-28","ids":{"openalex":"https://openalex.org/W2589055133","doi":"https://doi.org/10.1145/3011141.3011160","mag":"2589055133"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3011141.3011160","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110349640","display_name":"Yoshihisa Udagawa","orcid":null},"institutions":[{"id":"https://openalex.org/I31618427","display_name":"Tokyo Polytechnic University","ror":"https://ror.org/035kpke84","country_code":"JP","type":"funder","lineage":["https://openalex.org/I31618427"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yoshihisa Udagawa","raw_affiliation_strings":["Tokyo Polytechnic University, Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Polytechnic University, Japan","institution_ids":["https://openalex.org/I31618427"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5110349640"],"corresponding_institution_ids":["https://openalex.org/I31618427"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":2,"citation_normalized_percentile":{"value":0.427025,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":73,"max":77},"biblio":{"volume":null,"issue":null,"first_page":"26","last_page":"33"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9926,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.992,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.42923218}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7066558},{"id":"https://openalex.org/C137877099","wikidata":"https://www.wikidata.org/wiki/Q1332977","display_name":"Subsequence","level":3,"score":0.55446106},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.54587966},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5124986},{"id":"https://openalex.org/C120098539","wikidata":"https://www.wikidata.org/wiki/Q141001","display_name":"Longest common subsequence problem","level":2,"score":0.5003123},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.4927161},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45690575},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4488745},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.42923218},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.42154858},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.40440294},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39342988},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35869303},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18911052},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.093981415},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3011141.3011160","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":9,"referenced_works":["https://openalex.org/W1565377632","https://openalex.org/W1567790484","https://openalex.org/W1587010832","https://openalex.org/W1676985236","https://openalex.org/W2027506564","https://openalex.org/W2049386694","https://openalex.org/W2165739648","https://openalex.org/W2166559705","https://openalex.org/W2407458134"],"related_works":["https://openalex.org/W4323338832","https://openalex.org/W4289596129","https://openalex.org/W4225868058","https://openalex.org/W3083981518","https://openalex.org/W25732909","https://openalex.org/W2389167168","https://openalex.org/W2170721049","https://openalex.org/W2088055539","https://openalex.org/W1999879627","https://openalex.org/W170643605"],"abstract_inverted_index":{"Software":[0],"clones":[1,22,167],"are":[2],"introduced":[3],"to":[4,67,83,94,165],"source":[5],"code":[6,12,48],"by":[7],"copying":[8],"and":[9,130,172],"slightly":[10],"modifying":[11],"fragments":[13],"for":[14,133],"reuse.":[15],"Thus,":[16],"the":[17,25,96,105,110,145,159,162],"problem":[18],"of":[19,27,55,71,79,100,112,116,123,137,147,161,168],"finding":[20],"software":[21,36],"is":[23],"essentially":[24],"detection":[26,38],"strings":[28],"that":[29,51,81],"partially":[30],"match.":[31],"This":[32],"paper":[33,141],"describes":[34],"a":[35,41,47,58,69,77,113,148],"clone":[37],"technique":[39,50],"using":[40,151],"sequential":[42,101],"pattern-mining":[43],"algorithm.":[44],"After":[45],"outlining":[46],"normalization":[49],"extracts":[52],"code-matching":[53],"statements":[54],"interest":[56],"from":[57,76],"specific":[59],"programming":[60],"language,":[61],"viz.,":[62],"Java,":[63],"we":[64],"discuss":[65],"how":[66],"extract":[68],"set":[70,78],"frequent":[72,92,107],"sequences":[73,80,93,117,138],"with":[74,90],"gaps":[75],"correspond":[82],"methods.":[84],"The":[85,121,140,156],"proposed":[86,163],"algorithm":[87,164],"also":[88,142],"deals":[89],"maximal":[91,106],"find":[95,166],"most":[97],"compact":[98],"representation":[99],"patterns.":[102],"We":[103],"define":[104],"sequence":[108],"in":[109],"context":[111],"partial":[114,135],"match":[115],"or":[118],"gapped":[119],"sequences.":[120],"novelty":[122],"our":[124],"approach":[125],"includes":[126],"modified":[127],"longest-common-subsequence":[128],"(LCS)":[129],"backtrace":[131],"algorithms":[132],"handling":[134],"matches":[136],"systematically.":[139],"reports":[143],"on":[144],"results":[146,157],"case":[149],"study":[150],"Apache":[152],"Struts":[153],"2.5.2":[154],"Core.":[155],"demonstrate":[158],"ability":[160],"Types":[169],"1,":[170],"2,":[171],"3.":[173]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2589055133","counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-03-15T17:09:25.264356","created_date":"2017-02-24"}