{"id":"https://openalex.org/W2037437298","doi":"https://doi.org/10.1109/hisb.2012.17","title":"Demographics Identification: Variable Extraction Resource (DIVER)","display_name":"Demographics Identification: Variable Extraction Resource (DIVER)","publication_year":2012,"publication_date":"2012-09-01","ids":{"openalex":"https://openalex.org/W2037437298","doi":"https://doi.org/10.1109/hisb.2012.17","mag":"2037437298"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/hisb.2012.17","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038994451","display_name":"Alexander Hsieh","orcid":"https://orcid.org/0000-0003-4227-1952"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexander Hsieh","raw_affiliation_strings":["Department of Medicine University of California, San Diego La Jolla CA USA"],"affiliations":[{"raw_affiliation_string":"Department of Medicine University of California, San Diego La Jolla CA USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038899864","display_name":"Son Doan","orcid":"https://orcid.org/0000-0002-7284-1306"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Son Doan","raw_affiliation_strings":["Department of Medicine University of California, San Diego La Jolla CA USA"],"affiliations":[{"raw_affiliation_string":"Department of Medicine University of California, San Diego La Jolla CA USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024836029","display_name":"Michael Conway","orcid":"https://orcid.org/0000-0002-0848-8835"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Conway","raw_affiliation_strings":["Department of Medicine University of California, San Diego La Jolla CA USA"],"affiliations":[{"raw_affiliation_string":"Department of Medicine University of California, San Diego La Jolla CA USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043562937","display_name":"Ko\u2010Wei Lin","orcid":"https://orcid.org/0000-0001-6645-2091"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ko-Wei Lin","raw_affiliation_strings":["Department of Medicine University of California, San Diego La Jolla CA USA"],"affiliations":[{"raw_affiliation_string":"Department of Medicine University of California, San Diego La Jolla CA USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020006174","display_name":"Hyeoneui Kim","orcid":"https://orcid.org/0000-0002-5931-7286"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hyeoneui Kim","raw_affiliation_strings":["Department of Medicine University of California, San Diego La Jolla CA USA"],"affiliations":[{"raw_affiliation_string":"Department of Medicine University of California, San Diego La Jolla CA USA","institution_ids":["https://openalex.org/I36258959"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.493,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":4,"citation_normalized_percentile":{"value":0.632901,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":78,"max":80},"biblio":{"volume":null,"issue":null,"first_page":"40","last_page":"49"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10350","display_name":"Electronic Health Records Systems","score":0.9389,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/identification","display_name":"Identification","score":0.53782},{"id":"https://openalex.org/keywords/biorepository","display_name":"Biorepository","score":0.49152336}],"concepts":[{"id":"https://openalex.org/C547195049","wikidata":"https://www.wikidata.org/wiki/Q1725664","display_name":"Terminology","level":2,"score":0.60152084},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5749908},{"id":"https://openalex.org/C206497026","wikidata":"https://www.wikidata.org/wiki/Q1753883","display_name":"SNOMED CT","level":3,"score":0.5427849},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.53782},{"id":"https://openalex.org/C2780932742","wikidata":"https://www.wikidata.org/wiki/Q4915239","display_name":"Biorepository","level":3,"score":0.49152336},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.48456898},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.41949677},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.38841003},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.16345263},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.097747445},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.085489035},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C116567970","wikidata":"https://www.wikidata.org/wiki/Q864217","display_name":"Biobank","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/hisb.2012.17","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":22,"referenced_works":["https://openalex.org/W1545151484","https://openalex.org/W1611804050","https://openalex.org/W1973234126","https://openalex.org/W2027779823","https://openalex.org/W2036543624","https://openalex.org/W2064337796","https://openalex.org/W2098201295","https://openalex.org/W2102729801","https://openalex.org/W2106797966","https://openalex.org/W2117998960","https://openalex.org/W2120789186","https://openalex.org/W2120989936","https://openalex.org/W2122402213","https://openalex.org/W2124785215","https://openalex.org/W2139865360","https://openalex.org/W2152410429","https://openalex.org/W2158505321","https://openalex.org/W2270018644","https://openalex.org/W2331798554","https://openalex.org/W2395740409","https://openalex.org/W3155472991","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W3128306253","https://openalex.org/W3031493161","https://openalex.org/W2405923535","https://openalex.org/W2390249510","https://openalex.org/W2389049429","https://openalex.org/W2387710870","https://openalex.org/W2350181254","https://openalex.org/W2039735462","https://openalex.org/W1708042184","https://openalex.org/W1511848092"],"abstract_inverted_index":{"Lack":[0],"of":[1,58,82,96,107,136],"standardization":[2],"in":[3,8,37,61,142],"representing":[4],"phenotype":[5,140],"data":[6,16],"generated":[7],"different":[9],"studies":[10,60],"is":[11,132],"a":[12,29,56,137],"major":[13],"barrier":[14],"to":[15,65,70],"reuse":[17],"for":[18,139],"cross":[19],"study":[20],"analyses.":[21],"To":[22],"address":[23],"this":[24],"issue,":[25],"we":[26],"developed":[27],"DIVER,":[28],"tool":[30,119],"that":[31,109],"identifies":[32],"and":[33,45,84,87],"standardizes":[34],"demographic":[35,77,99],"variables":[36,53,73,78,100,108],"dbGaP,":[38,62],"based":[39],"on":[40,116],"simple":[41],"natural":[42],"language":[43],"processing":[44],"standardized":[46],"terminology":[47],"mapping.":[48],"In":[49,90],"its":[50,127],"evaluation":[51],"using":[52],"(N=3,565)":[54],"from":[55],"range":[57],"pulmonary":[59],"DIVER":[63,92,110,131],"proved":[64],"be":[66],"an":[67,133],"effective":[68],"approach":[69],"standardizing":[71],"dbGaP":[72,143],"by":[74],"successfully":[75],"identifying":[76],"with":[79],"high":[80],"rates":[81],"recall":[83],"precision":[85],"(98%":[86],"94%,":[88],"respectively).":[89],"addition,":[91],"correctly":[93],"modeled":[94],"79%":[95],"the":[97,102],"identified":[98],"at":[101],"core":[103],"semantic":[104,128],"level.":[105],"Examination":[106],"could":[111],"not":[112],"handle":[113],"shed":[114],"light":[115],"where":[117],"our":[118],"needs":[120],"enhancement":[121],"so":[122],"it":[123],"can":[124],"further":[125],"improve":[126],"modeling":[129],"accuracy.":[130],"important":[134],"component":[135],"system":[138],"discovery":[141],"studies.":[144]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2037437298","counts_by_year":[{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":1}],"updated_date":"2025-03-25T00:10:14.291229","created_date":"2016-06-24"}