{"id":"https://openalex.org/W1985994919","doi":"https://doi.org/10.1109/icsm.2012.6405329","title":"Who's who in Gnome: Using LSA to merge software repository identities","display_name":"Who's who in Gnome: Using LSA to merge software repository identities","publication_year":2012,"publication_date":"2012-09-01","ids":{"openalex":"https://openalex.org/W1985994919","doi":"https://doi.org/10.1109/icsm.2012.6405329","mag":"1985994919"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsm.2012.6405329","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027088423","display_name":"Erik Kouters","orcid":null},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Erik Kouters","raw_affiliation_strings":["Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#","institution_ids":["https://openalex.org/I83019370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050821883","display_name":"Bogdan Vasilescu","orcid":"https://orcid.org/0000-0003-4418-5783"},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Bogdan Vasilescu","raw_affiliation_strings":["Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#","institution_ids":["https://openalex.org/I83019370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054753279","display_name":"Alexander Serebrenik","orcid":"https://orcid.org/0000-0002-1418-0095"},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Alexander Serebrenik","raw_affiliation_strings":["Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#","institution_ids":["https://openalex.org/I83019370"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029542014","display_name":"Mark van den Brand","orcid":"https://orcid.org/0000-0003-3529-6182"},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Mark G. J. van den Brand","raw_affiliation_strings":["Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universiteit Eindhoven, Den Dolech 2, P.O. Box 513, 5600 MB Eindhoven, The Netherlands#TAB#","institution_ids":["https://openalex.org/I83019370"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.61,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":64,"citation_normalized_percentile":{"value":0.936202,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"592","last_page":"595"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9916,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9866,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.67544127},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness","score":0.58821225},{"id":"https://openalex.org/keywords/latent-semantic-analysis","display_name":"Latent semantic analysis","score":0.50019956}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.82561743},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.67544127},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.6253029},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.58821225},{"id":"https://openalex.org/C170133592","wikidata":"https://www.wikidata.org/wiki/Q1806883","display_name":"Latent semantic analysis","level":2,"score":0.50019956},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4958044},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46845317},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4293539},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10014692},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsm.2012.6405329","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life on land","id":"https://metadata.un.org/sdg/15","score":0.6}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":13,"referenced_works":["https://openalex.org/W1983578042","https://openalex.org/W1990566545","https://openalex.org/W2039001182","https://openalex.org/W2039785095","https://openalex.org/W2076279155","https://openalex.org/W2079081534","https://openalex.org/W2119410041","https://openalex.org/W2136101509","https://openalex.org/W2163960678","https://openalex.org/W3150747159","https://openalex.org/W4240701274","https://openalex.org/W4251218026","https://openalex.org/W4252434862"],"related_works":["https://openalex.org/W83344948","https://openalex.org/W2802443881","https://openalex.org/W2364562957","https://openalex.org/W2354429408","https://openalex.org/W2351030537","https://openalex.org/W2350230178","https://openalex.org/W2350178533","https://openalex.org/W2119135658","https://openalex.org/W2101966962","https://openalex.org/W2001121861"],"abstract_inverted_index":{"Understanding":[0],"an":[1,5],"individual's":[2],"contribution":[3],"to":[4,15,39,61,111,131],"ecosystem":[6,20],"often":[7],"necessitates":[8],"integrating":[9],"information":[10],"from":[11],"multiple":[12],"repositories":[13,25],"corresponding":[14],"different":[16,22,36,49],"projects":[17],"within":[18],"the":[19,40,65,69,72,74,76,82,85,99],"or":[21],"kinds":[23],"of":[24,84,106,114,137,147,164],"(e.g.,":[26],"mail":[27],"archives":[28],"and":[29,103,141,166],"version":[30],"control":[31],"systems).":[32],"However,":[33],"recognising":[34],"that":[35,54],"contributions":[37],"belong":[38],"same":[41,70],"contributor":[42],"is":[43,52],"challenging,":[44],"since":[45],"developers":[46],"may":[47],"use":[48],"aliases.":[50],"It":[51],"known":[53],"existing":[55,107,160],"identity":[56,121],"merging":[57,122],"algorithms":[58,108,161],"are":[59],"sensitive":[60],"large":[62,89],"discrepancies":[63],"between":[64],"aliases":[66],"used":[67],"by":[68,145],"individual:":[71],"noisier":[73],"data,":[75],"worse":[77],"their":[78],"performance.":[79],"To":[80],"assess":[81],"scale":[83],"problem":[86],"for":[87],"a":[88,119,156],"software":[90],"ecosystem,":[91],"we":[92],"study":[93],"all":[94],"Gnome":[95,150],"Git":[96,151],"repositories,":[97],"classify":[98],"differences":[100,138],"in":[101,139,162],"aliases,":[102,140],"discuss":[104],"robustness":[105],"with":[109],"respect":[110],"these":[112],"types":[113,136],"differences.":[115],"We":[116],"then":[117],"propose":[118],"new":[120],"algorithm":[123],"based":[124],"on":[125,149,168],"Latent":[126],"Semantic":[127],"Analysis":[128],"(LSA),":[129],"designed":[130],"be":[132],"robust":[133],"against":[134],"more":[135],"evaluate":[142],"it":[143],"empirically":[144],"means":[146],"cross-validation":[148],"authors.":[152],"Our":[153],"results":[154],"show":[155],"clear":[157],"improvement":[158],"over":[159],"terms":[163],"precision":[165],"recall":[167],"worst-case":[169],"input":[170],"data.":[171]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1985994919","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":8},{"year":2013,"cited_by_count":7}],"updated_date":"2025-01-18T12:54:58.183240","created_date":"2016-06-24"}