{"id":"https://openalex.org/W2017009364","doi":"https://doi.org/10.1145/2016039.2016067","title":"Quantifying the similiarities between source code lexicons","display_name":"Quantifying the similiarities between source code lexicons","publication_year":2011,"publication_date":"2011-03-24","ids":{"openalex":"https://openalex.org/W2017009364","doi":"https://doi.org/10.1145/2016039.2016067","mag":"2017009364"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/2016039.2016067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020479596","display_name":"Lauren R. Biggers","orcid":null},"institutions":[{"id":"https://openalex.org/I17301866","display_name":"University of Alabama","ror":"https://ror.org/03xrrjk67","country_code":"US","type":"education","lineage":["https://openalex.org/I17301866"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lauren R. Biggers","raw_affiliation_strings":["The University of Alabama (Tuscaloosa, AL)"],"affiliations":[{"raw_affiliation_string":"The University of Alabama (Tuscaloosa, AL)","institution_ids":["https://openalex.org/I17301866"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051151566","display_name":"Nicholas A. Kraft","orcid":"https://orcid.org/0000-0002-7960-766X"},"institutions":[{"id":"https://openalex.org/I17301866","display_name":"University of Alabama","ror":"https://ror.org/03xrrjk67","country_code":"US","type":"education","lineage":["https://openalex.org/I17301866"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicholas A. Kraft","raw_affiliation_strings":["The University of Alabama (Tuscaloosa, AL)"],"affiliations":[{"raw_affiliation_string":"The University of Alabama (Tuscaloosa, AL)","institution_ids":["https://openalex.org/I17301866"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.388,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":3,"citation_normalized_percentile":{"value":0.513597,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":76,"max":78},"biblio":{"volume":null,"issue":null,"first_page":"80","last_page":"85"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9955,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9904,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.52425766},{"id":"https://openalex.org/keywords/program-comprehension","display_name":"Program comprehension","score":0.43352214}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.81326437},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.81007355},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.7622279},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.65753067},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.64119923},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5537065},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5525701},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.52425766},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.47275314},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.44321302},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.43352214},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38288614},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33080956},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32869822},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.32849622},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.23234501},{"id":"https://openalex.org/C149091818","wikidata":"https://www.wikidata.org/wiki/Q2429814","display_name":"Software system","level":3,"score":0.17379102},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.115579486},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.073569834},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/2016039.2016067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.46,"display_name":"Quality education"}],"grants":[{"funder":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation","award_id":"915559"}],"datasets":[],"versions":[],"referenced_works_count":25,"referenced_works":["https://openalex.org/W1490674333","https://openalex.org/W1525720009","https://openalex.org/W1967995512","https://openalex.org/W1992055950","https://openalex.org/W2018663431","https://openalex.org/W2041853131","https://openalex.org/W2056056700","https://openalex.org/W2099969795","https://openalex.org/W2104876936","https://openalex.org/W2117990499","https://openalex.org/W2128581098","https://openalex.org/W2129669092","https://openalex.org/W2135866290","https://openalex.org/W2139543149","https://openalex.org/W2141102925","https://openalex.org/W2145400454","https://openalex.org/W2147122181","https://openalex.org/W2152474046","https://openalex.org/W2156833313","https://openalex.org/W2158324307","https://openalex.org/W2163665793","https://openalex.org/W2171816001","https://openalex.org/W2913215602","https://openalex.org/W2990138404","https://openalex.org/W4302978359"],"related_works":["https://openalex.org/W3135060008","https://openalex.org/W3104152981","https://openalex.org/W3008773848","https://openalex.org/W2810057064","https://openalex.org/W2165862892","https://openalex.org/W2139694402","https://openalex.org/W2136808032","https://openalex.org/W2122804569","https://openalex.org/W2098192829","https://openalex.org/W2066182606"],"abstract_inverted_index":{"Several":[0],"recent":[1],"static":[2],"analysis":[3],"techniques":[4,29],"automate":[5],"software":[6],"understanding":[7],"activities":[8],"by":[9],"extracting":[10,55],"textual":[11],"information":[12,18,50],"from":[13,116,129],"source":[14,26,82,106],"code":[15,27,83],"and":[16,57,91,145],"applying":[17],"retrieval":[19,28],"models":[20],"to":[21,118,131,142],"the":[22,33,46,52,78,87,121,125,134,140],"extracted":[23],"corpora.":[24],"These":[25],"show":[30],"efficacy,":[31],"but":[32],"literature":[34,47],"provides":[35,48],"no":[36],"guidance":[37],"regarding":[38,51],"configuration":[39],"of":[40,54,103,120,133],"their":[41],"constituent":[42],"processes.":[43],"For":[44],"example,":[45],"conflicting":[49],"benefit":[53],"comments":[56,126,144],"string":[58,92,146],"literals":[59,147],"along":[60],"with":[61],"identifiers":[62],"such":[63],"as":[64],"method":[65],"or":[66],"variable":[67],"names.":[68],"In":[69],"this":[70],"paper":[71],"we":[72],"present":[73],"an":[74],"initial":[75],"investigation":[76],"into":[77],"similarities":[79],"between":[80],"three":[81,96],"lexicons":[84],"described":[85],"in":[86],"literature:":[88],"identifiers,":[89],"comments,":[90],"literals.":[93],"We":[94],"address":[95],"research":[97],"questions":[98],"using":[99],"a":[100],"case":[101],"study":[102],"six":[104],"open":[105],"Java":[107],"projects.":[108],"The":[109],"results":[110],"indicate":[111],"that":[112],"methods":[113],"uniquely":[114,127],"contain":[115,128],"30%":[117],"60%":[119],"projects'":[122],"terms,":[123],"whereas":[124],"22%":[130],"45%":[132],"terms.":[135,154],"Future":[136],"work":[137],"includes":[138],"analyzing":[139],"extent":[141],"which":[143],"introduce":[148],"domain":[149],"terms":[150],"rather":[151],"than":[152],"non-domain":[153]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2017009364","counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2024-12-10T22:00:02.449590","created_date":"2016-06-24"}