{"id":"https://openalex.org/W3006121039","doi":"https://doi.org/10.1089/cmb.2019.0500","title":"Incorporating Nearest-Neighbor Site Dependence into Protein Evolution Models","display_name":"Incorporating Nearest-Neighbor Site Dependence into Protein Evolution Models","publication_year":2020,"publication_date":"2020-02-13","ids":{"openalex":"https://openalex.org/W3006121039","doi":"https://doi.org/10.1089/cmb.2019.0500","mag":"3006121039","pmid":"https://pubmed.ncbi.nlm.nih.gov/32053390","pmcid":"https://www.ncbi.nlm.nih.gov/pmc/articles/7081252"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1089/cmb.2019.0500","pdf_url":null,"source":{"id":"https://openalex.org/S78571599","display_name":"Journal of Computational Biology","issn_l":"1066-5277","issn":["1066-5277","1557-8666"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320443","host_organization_name":"Mary Ann Liebert, Inc.","host_organization_lineage":["https://openalex.org/P4310320443"],"host_organization_lineage_names":["Mary Ann Liebert, Inc."],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7081252","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110718195","display_name":"Gary Larson","orcid":null},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"funder","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gary Larson","raw_affiliation_strings":["Department of Statistical Science, Duke University, Durham, North Carolina."],"affiliations":[{"raw_affiliation_string":"Department of Statistical Science, Duke University, Durham, North Carolina.","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064952920","display_name":"Jeffrey L. Thorne","orcid":"https://orcid.org/0000-0003-3779-5743"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"funder","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeffrey L. Thorne","raw_affiliation_strings":["Department of Biological Sciences, North Carolina State University, Raleigh, North Carolina.","Department of Statistics, North Carolina State University, Raleigh, North Carolina."],"affiliations":[{"raw_affiliation_string":"Department of Biological Sciences, North Carolina State University, Raleigh, North Carolina.","institution_ids":["https://openalex.org/I137902535"]},{"raw_affiliation_string":"Department of Statistics, North Carolina State University, Raleigh, North Carolina.","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077085817","display_name":"Scott C. Schmidler","orcid":"https://orcid.org/0009-0006-3733-3716"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"funder","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Scott Schmidler","raw_affiliation_strings":["Department of Computer Science, Duke University, Durham, North Carolina.","Department of Statistical Science, Duke University, Durham, North Carolina."],"affiliations":[{"raw_affiliation_string":"Department of Statistical Science, Duke University, Durham, North Carolina.","institution_ids":["https://openalex.org/I170897317"]},{"raw_affiliation_string":"Department of Computer Science, Duke University, Durham, North Carolina.","institution_ids":["https://openalex.org/I170897317"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5077085817"],"corresponding_institution_ids":["https://openalex.org/I170897317"],"apc_list":null,"apc_paid":null,"fwci":0.158,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.474867,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":82,"max":83},"biblio":{"volume":"27","issue":"3","first_page":"361","last_page":"375"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10012","display_name":"Genetic diversity and population structure","score":0.9808,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9807,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multiple-sequence-alignment","display_name":"Multiple sequence alignment","score":0.5672836},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.47111583},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.41254842}],"concepts":[{"id":"https://openalex.org/C193252679","wikidata":"https://www.wikidata.org/wiki/Q242125","display_name":"Phylogenetic tree","level":3,"score":0.64288056},{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.5672836},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.51383454},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.47111583},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.45409364},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.42893735},{"id":"https://openalex.org/C90132467","wikidata":"https://www.wikidata.org/wiki/Q171184","display_name":"Phylogenetics","level":3,"score":0.41598064},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.41254842},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.39019647},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3790513},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3552957},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.34857565},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.20614672},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.1931245},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D040681","descriptor_name":"Structural Homology, Protein","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1089/cmb.2019.0500","pdf_url":null,"source":{"id":"https://openalex.org/S78571599","display_name":"Journal of Computational Biology","issn_l":"1066-5277","issn":["1066-5277","1557-8666"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320443","host_organization_name":"Mary Ann Liebert, Inc.","host_organization_lineage":["https://openalex.org/P4310320443"],"host_organization_lineage_names":["Mary Ann Liebert, Inc."],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7081252","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32053390","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7081252","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Zero hunger","id":"https://metadata.un.org/sdg/2","score":0.44}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":10,"referenced_works":["https://openalex.org/W1985040965","https://openalex.org/W2009570821","https://openalex.org/W2090617952","https://openalex.org/W2092979861","https://openalex.org/W2094548241","https://openalex.org/W2111755094","https://openalex.org/W2129039174","https://openalex.org/W2157831257","https://openalex.org/W2186750819","https://openalex.org/W3199943451"],"related_works":["https://openalex.org/W65850283","https://openalex.org/W3186624150","https://openalex.org/W2949296710","https://openalex.org/W2883025420","https://openalex.org/W2804480386","https://openalex.org/W2174809885","https://openalex.org/W2132972885","https://openalex.org/W2111939425","https://openalex.org/W2057191541","https://openalex.org/W1992658754"],"abstract_inverted_index":{"Evolutionary":[0],"models":[1,23],"of":[2,13,21,29,41,48,120,165,184,199],"proteins":[3],"are":[4],"widely":[5,53],"used":[6,54],"for":[7,71,105],"statistical":[8,69],"sequence":[9,96,186,202],"alignment":[10],"and":[11,15,58,61,79,85,171],"inference":[12],"homology":[14,64],"phylogeny.":[16],"However,":[17],"the":[18,38,152,193,197],"vast":[19],"majority":[20],"these":[22],"rely":[24],"on":[25,37],"an":[26],"unrealistic":[27],"assumption":[28],"independent":[30],"evolution":[31,74,203],"between":[32],"sites.":[33],"Here":[34,98],"we":[35,99,189],"focus":[36],"related":[39],"problem":[40],"protein":[42,72,121],"structure":[43,122],"alignment,":[44],"a":[45,117,126,132,162,181],"classic":[46],"tool":[47],"computational":[49,145],"biology":[50],"that":[51,91,158],"is":[52,116],"to":[55,62,81,103,191],"identify":[56],"structural":[57,73],"functional":[59],"similarity":[60],"infer":[63],"among":[65,109],"proteins.":[66],"A":[67],"site-independent":[68,153,201],"model":[70,102,119,139,154,183],"has":[75],"previously":[76],"been":[77],"introduced":[78],"shown":[80],"significantly":[82],"improve":[83,174],"alignments":[84],"phylogenetic":[86,175],"inferences":[87],"compared":[88,150],"with":[89,131,142,151],"approaches":[90],"utilize":[92],"only":[93],"amino":[94,111],"acid":[95,112],"information.":[97],"extend":[100],"this":[101,159],"account":[104],"correlated":[106],"evolutionary":[107,169],"drift":[108],"neighboring":[110],"positions.":[113],"The":[114],"result":[115],"spatiotemporal":[118],"evolution,":[123,187],"described":[124],"by":[125],"multivariate":[127],"diffusion":[128],"process":[129],"convolved":[130],"spatial":[133],"birth\u2013death":[134],"process.":[135],"This":[136],"extended":[137],"site-dependent":[138,185],"(SDM)":[140],"comes":[141],"little":[143],"additional":[144],"cost":[146],"or":[147],"analytical":[148],"complexity":[149],"(SIM).":[155],"We":[156,178],"demonstrate":[157,192],"SDM":[160],"yields":[161],"significant":[163],"reduction":[164],"bias":[166,194],"in":[167],"estimated":[168],"distances":[170],"helps":[172],"further":[173],"tree":[176],"reconstruction.":[177],"also":[179],"develop":[180],"simple":[182],"which":[188],"use":[190],"resulting":[195],"from":[196],"application":[198],"standard":[200],"models.":[204]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3006121039","counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-03-24T00:55:39.401218","created_date":"2020-02-24"}