{"id":"https://openalex.org/W2090987348","doi":"https://doi.org/10.1002/asi.20105","title":"A probabilistic similarity metric for Medline records: A model for author name disambiguation","display_name":"A probabilistic similarity metric for Medline records: A model for author name disambiguation","publication_year":2004,"publication_date":"2004-11-05","ids":{"openalex":"https://openalex.org/W2090987348","doi":"https://doi.org/10.1002/asi.20105","mag":"2090987348"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1002/asi.20105","pdf_url":null,"source":{"id":"https://openalex.org/S80113298","display_name":"Journal of the American Society for Information Science and Technology","issn_l":"1532-2882","issn":["1532-2882","1532-2890"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":"http://arrowsmith.psych.uic.edu/arrowsmith_uic/tutorial/torvik_jasist_2005.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079566229","display_name":"Vetle I. Torvik","orcid":"https://orcid.org/0000-0002-0035-1850"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vetle I. Torvik","raw_affiliation_strings":["Department of Psychiatry (MC912), University of Illinois, Chicago, 1601 W. Taylor Street, Chicago, IL 60612"],"affiliations":[{"raw_affiliation_string":"Department of Psychiatry (MC912), University of Illinois, Chicago, 1601 W. Taylor Street, Chicago, IL 60612","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061783958","display_name":"Marc Weeber","orcid":null},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marc Weeber","raw_affiliation_strings":["Department of Psychiatry (MC912), University of Illinois, Chicago, 1601 W. Taylor Street, Chicago, IL 60612"],"affiliations":[{"raw_affiliation_string":"Department of Psychiatry (MC912), University of Illinois, Chicago, 1601 W. Taylor Street, Chicago, IL 60612","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103564473","display_name":"Don R. Swanson","orcid":null},"institutions":[{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Don R. Swanson","raw_affiliation_strings":["Division of the Humanities, University of Chicago, Chicago, IL 60637"],"affiliations":[{"raw_affiliation_string":"Division of the Humanities, University of Chicago, Chicago, IL 60637","institution_ids":["https://openalex.org/I40347166"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033859037","display_name":"Neil R. Smalheiser","orcid":"https://orcid.org/0000-0003-1079-3406"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Neil R. Smalheiser","raw_affiliation_strings":["Department of Psychiatry (MC912), University of Illinois, Chicago, 1601 W. Taylor Street, Chicago, IL 60612"],"affiliations":[{"raw_affiliation_string":"Department of Psychiatry (MC912), University of Illinois, Chicago, 1601 W. Taylor Street, Chicago, IL 60612","institution_ids":["https://openalex.org/I39422238"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.728,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":199,"citation_normalized_percentile":{"value":0.969393,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"56","issue":"2","first_page":"140","last_page":"158"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9921,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.76275694}],"concepts":[{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.76275694},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6859977},{"id":"https://openalex.org/C2779804580","wikidata":"https://www.wikidata.org/wiki/Q102047","display_name":"Suffix","level":2,"score":0.5974632},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.59678936},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5900795},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5735189},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.53488606},{"id":"https://openalex.org/C2777855551","wikidata":"https://www.wikidata.org/wiki/Q12310021","display_name":"Subject (documents)","level":2,"score":0.5036325},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49558318},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33708417},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.22057632},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.12658155},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1002/asi.20105","pdf_url":null,"source":{"id":"https://openalex.org/S80113298","display_name":"Journal of the American Society for Information Science and Technology","issn_l":"1532-2882","issn":["1532-2882","1532-2890"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.90.7609","pdf_url":"http://arrowsmith.psych.uic.edu/arrowsmith_uic/tutorial/torvik_jasist_2005.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.90.7609","pdf_url":"http://arrowsmith.psych.uic.edu/arrowsmith_uic/tutorial/torvik_jasist_2005.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":28,"referenced_works":["https://openalex.org/W1525742988","https://openalex.org/W1570958430","https://openalex.org/W1800493452","https://openalex.org/W1885411690","https://openalex.org/W1971784203","https://openalex.org/W1991885012","https://openalex.org/W2024030746","https://openalex.org/W2025572017","https://openalex.org/W2033614115","https://openalex.org/W2048045485","https://openalex.org/W2057729687","https://openalex.org/W2061312249","https://openalex.org/W2069334446","https://openalex.org/W2074302780","https://openalex.org/W2127674618","https://openalex.org/W2141585940","https://openalex.org/W2143683307","https://openalex.org/W2151393344","https://openalex.org/W2153252192","https://openalex.org/W2158608196","https://openalex.org/W2165612380","https://openalex.org/W2319660501","https://openalex.org/W2787478004","https://openalex.org/W2795929191","https://openalex.org/W2913519381","https://openalex.org/W4237045180","https://openalex.org/W4237720795","https://openalex.org/W4289256748"],"related_works":["https://openalex.org/W4388258507","https://openalex.org/W4311055779","https://openalex.org/W3128574596","https://openalex.org/W2989529099","https://openalex.org/W2981728181","https://openalex.org/W2978475281","https://openalex.org/W2761558751","https://openalex.org/W2748952813","https://openalex.org/W2391300236","https://openalex.org/W2371678724"],"abstract_inverted_index":{"Abstract":[0],"We":[1,120],"present":[2],"a":[3,10,35,42,106,123,139,146],"model":[4,33,112],"for":[5],"estimating":[6],"the":[7,29,64,97,111],"probability":[8,163],"that":[9,130,152],"pair":[11,43],"of":[12,44,80,82,109,148],"author":[13,87],"names":[14],"(sharing":[15],"last":[16],"name":[17,60,136],"and":[18,59,68,103,142],"first":[19,155],"initial),":[20],"appearing":[21],"on":[22,47,138],"two":[23],"different":[24],"Medline":[25],"articles,":[26,45],"refer":[27],"to":[28],"same":[30],"individual.":[31],"The":[32,70],"uses":[34],"simple":[36],"yet":[37],"powerful":[38],"similarity":[39,71],"profile":[40,72],"between":[41],"based":[46],"title,":[48],"journal":[49],"name,":[50,154],"coauthor":[51],"names,":[52],"medical":[53],"subject":[54],"headings":[55],"(MeSH),":[56],"language,":[57],"affiliation,":[58],"attributes":[61],"(prevalence":[62],"in":[63,92],"literature,":[65],"middle":[66],"initial,":[67],"suffix).":[69],"distribution":[73],"is":[74,100,113],"computed":[75],"from":[76],"reference":[77],"sets":[78],"consisting":[79],"pairs":[81],"articles":[83,150],"containing":[84],"almost":[85],"exclusively":[86],"matches":[88],"versus":[89],"nonmatches,":[90,110],"generated":[91,101],"an":[93,134],"unbiased":[94],"manner.":[95],"Although":[96],"match":[98,162],"set":[99],"automatically":[102],"might":[104],"contain":[105],"small":[107],"proportion":[108],"quite":[114],"robust":[115],"against":[116],"contamination":[117],"with":[118,151,161],"nonmatches.":[119],"have":[121],"created":[122],"free,":[124],"public":[125],"service":[126],"(\u201cAuthor\u2010ity\u201d:":[127],"http://arrowsmith.psych.uic.edu":[128],")":[129],"takes":[131],"as":[132,144],"input":[133],"author's":[135],"given":[137],"specific":[140],"article,":[141],"gives":[143],"output":[145],"list":[147],"all":[149],"(last":[153],"initial)":[156],"ranked":[157],"by":[158],"decreasing":[159],"similarity,":[160],"indicated.":[164]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2090987348","counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":12},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":11},{"year":2015,"cited_by_count":16},{"year":2014,"cited_by_count":26},{"year":2013,"cited_by_count":8},{"year":2012,"cited_by_count":13}],"updated_date":"2025-01-08T20:47:58.122727","created_date":"2016-06-24"}