{"id":"https://openalex.org/W2103609042","doi":"https://doi.org/10.1093/bioinformatics/btr263","title":"Genome annotation test with validation on transcription start site and ChIP-Seq for Pol-II binding data","display_name":"Genome annotation test with validation on transcription start site and ChIP-Seq for Pol-II binding data","publication_year":2011,"publication_date":"2011-05-09","ids":{"openalex":"https://openalex.org/W2103609042","doi":"https://doi.org/10.1093/bioinformatics/btr263","mag":"2103609042","pmid":"https://pubmed.ncbi.nlm.nih.gov/21558156"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btr263","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/27/12/1610/48862821/bioinformatics_27_12_1610.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311647","https://openalex.org/P4310311648"],"host_organization_lineage_names":["University of Oxford","Oxford University Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://academic.oup.com/bioinformatics/article-pdf/27/12/1610/48862821/bioinformatics_27_12_1610.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064626077","display_name":"Justin Bed\u0151","orcid":"https://orcid.org/0000-0001-5704-0212"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]},{"id":"https://openalex.org/I42894916","display_name":"Data61","ror":"https://ror.org/03q397159","country_code":"AU","type":"other","lineage":["https://openalex.org/I1292875679","https://openalex.org/I2801453606","https://openalex.org/I42894916","https://openalex.org/I4387156119"]},{"id":"https://openalex.org/I4210107733","display_name":"Informatique, Biologie Int\u00e9grative et Syst\u00e8mes Complexes","ror":"https://ror.org/01aqxgr98","country_code":"FR","type":"facility","lineage":["https://openalex.org/I277688954","https://openalex.org/I4210107733","https://openalex.org/I88467170"]}],"countries":["AU","FR"],"is_corresponding":false,"raw_author_name":"Justin Bedo","raw_affiliation_strings":["1 National ICT Australia, Victoria Research Laboratories, The University of Melbourne, VIC 3010, Australia and 2Informatique Biologie Int\u00e9grative et Syst\u00e8mes Complexes, Tour Evry II, 523 Place des Terrasses de l'Agora, 91000 Evry, France"],"affiliations":[{"raw_affiliation_string":"1 National ICT Australia, Victoria Research Laboratories, The University of Melbourne, VIC 3010, Australia and 2Informatique Biologie Int\u00e9grative et Syst\u00e8mes Complexes, Tour Evry II, 523 Place des Terrasses de l'Agora, 91000 Evry, France","institution_ids":["https://openalex.org/I165779595","https://openalex.org/I42894916","https://openalex.org/I4210107733","https://openalex.org/I165779595","https://openalex.org/I42894916","https://openalex.org/I4210107733"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101601191","display_name":"Adam Kowalczyk","orcid":"https://orcid.org/0000-0001-9068-3383"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]},{"id":"https://openalex.org/I42894916","display_name":"Data61","ror":"https://ror.org/03q397159","country_code":"AU","type":"other","lineage":["https://openalex.org/I1292875679","https://openalex.org/I2801453606","https://openalex.org/I42894916","https://openalex.org/I4387156119"]},{"id":"https://openalex.org/I4210107733","display_name":"Informatique, Biologie Int\u00e9grative et Syst\u00e8mes Complexes","ror":"https://ror.org/01aqxgr98","country_code":"FR","type":"facility","lineage":["https://openalex.org/I277688954","https://openalex.org/I4210107733","https://openalex.org/I88467170"]}],"countries":["AU","FR"],"is_corresponding":false,"raw_author_name":"Adam Kowalczyk","raw_affiliation_strings":["1 National ICT Australia, Victoria Research Laboratories, The University of Melbourne, VIC 3010, Australia and 2Informatique Biologie Int\u00e9grative et Syst\u00e8mes Complexes, Tour Evry II, 523 Place des Terrasses de l'Agora, 91000 Evry, France"],"affiliations":[{"raw_affiliation_string":"1 National ICT Australia, Victoria Research Laboratories, The University of Melbourne, VIC 3010, Australia and 2Informatique Biologie Int\u00e9grative et Syst\u00e8mes Complexes, Tour Evry II, 523 Place des Terrasses de l'Agora, 91000 Evry, France","institution_ids":["https://openalex.org/I165779595","https://openalex.org/I42894916","https://openalex.org/I4210107733"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":3618,"currency":"USD","value_usd":3618,"provenance":"doaj"},"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":65},"biblio":{"volume":"27","issue":"12","first_page":"1610","last_page":"1617"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.63321865}],"concepts":[{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.64157915},{"id":"https://openalex.org/C2775905019","wikidata":"https://www.wikidata.org/wiki/Q192572","display_name":"In silico","level":3,"score":0.633445},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.63321865},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6277001},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.44811493},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.43768337},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4277172},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.41936928},{"id":"https://openalex.org/C89566754","wikidata":"https://www.wikidata.org/wiki/Q2273828","display_name":"Genome project","level":4,"score":0.41857833},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24417728},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.22999194},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.19360167},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.11077306}],"mesh":[{"descriptor_ui":"D047369","descriptor_name":"Chromatin Immunoprecipitation","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D004257","descriptor_name":"DNA Polymerase II","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D058977","descriptor_name":"Molecular Sequence Annotation","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D024363","descriptor_name":"Transcription Initiation Site","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001665","descriptor_name":"Binding Sites","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004257","descriptor_name":"DNA Polymerase II","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015894","descriptor_name":"Genome, Human","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D058977","descriptor_name":"Molecular Sequence Annotation","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011401","descriptor_name":"Promoter Regions, Genetic","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D050794","descriptor_name":"STAT1 Transcription Factor","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D050794","descriptor_name":"STAT1 Transcription Factor","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017422","descriptor_name":"Sequence Analysis, DNA","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btr263","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/27/12/1610/48862821/bioinformatics_27_12_1610.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311647","https://openalex.org/P4310311648"],"host_organization_lineage_names":["University of Oxford","Oxford University Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/21558156","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btr263","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/27/12/1610/48862821/bioinformatics_27_12_1610.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311647","https://openalex.org/P4310311648"],"host_organization_lineage_names":["University of Oxford","Oxford University Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.51,"display_name":"Partnerships for the goals"},{"id":"https://metadata.un.org/sdg/9","score":0.41,"display_name":"Industry, innovation and infrastructure"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":20,"referenced_works":["https://openalex.org/W1965100590","https://openalex.org/W1976526581","https://openalex.org/W1996212302","https://openalex.org/W2003463914","https://openalex.org/W2011064727","https://openalex.org/W2049569197","https://openalex.org/W2049970533","https://openalex.org/W2082043931","https://openalex.org/W2099961908","https://openalex.org/W2105089812","https://openalex.org/W2105776281","https://openalex.org/W2111400482","https://openalex.org/W2123231299","https://openalex.org/W2130410032","https://openalex.org/W2140948028","https://openalex.org/W2142976423","https://openalex.org/W2148503087","https://openalex.org/W2152100019","https://openalex.org/W2157825442","https://openalex.org/W2166971561"],"related_works":["https://openalex.org/W2957309664","https://openalex.org/W2497609083","https://openalex.org/W2319942811","https://openalex.org/W2135993011","https://openalex.org/W2079600570","https://openalex.org/W2063853667","https://openalex.org/W2047016028","https://openalex.org/W1976142521","https://openalex.org/W142583359","https://openalex.org/W110079389"],"abstract_inverted_index":{"Abstract":[0],"Motivation:":[1],"Many":[2,32],"ChIP-Seq":[3,143],"experiments":[4,35],"are":[5,51,230],"aimed":[6],"at":[7,97,232],"developing":[8],"gold":[9],"standards":[10],"for":[11,85,179],"determining":[12],"the":[13,29,52,118,121,137,168,180,198,217],"locations":[14],"of":[15,56,89,120,133,146,159,171,186,200,213],"various":[16],"genomic":[17],"features":[18],"such":[19,33],"as":[20,48],"transcription":[21,24,189],"start":[22,190],"or":[23],"factor":[25],"binding":[26,150,160],"sites":[27,161],"on":[28,78],"whole":[30,138],"genome.":[31],"pioneering":[34],"lack":[36],"rigorous":[37],"testing":[38],"methods":[39],"and":[40,92,116,148,183],"adequate":[41],"\u2018gold":[42],"standard\u2019":[43],"annotations":[44],"to":[45,95,114,140,216],"compare":[46,117],"against":[47,74,155,176],"they":[49],"themselves":[50],"most":[53],"reliable":[54],"source":[55],"empirical":[57],"data":[58,229],"available.":[59],"To":[60],"overcome":[61],"this":[62,172],"problem,":[63],"we":[64,135],"propose":[65],"a":[66,70,79,90,105,131,210],"self-consistency":[67],"test":[68,128],"whereby":[69],"dataset":[71],"is":[72,153,174],"tested":[73],"itself.":[75],"It":[76],"relies":[77],"supervised":[80,123],"machine":[81],"learning":[82,124],"style":[83],"protocol":[84,139],"in":[86,112,156,187,201],"silico":[87,157,188,202],"annotation":[88,204],"genome":[91,203,215],"accuracy":[93],"estimation":[94],"guarantee,":[96],"least,":[98],"self-consistency.":[99],"Results:":[100],"The":[101],"main":[102,169],"results":[103,195,208],"use":[104],"novel":[106],"performance":[107],"metric":[108],"(a":[109],"calibrated":[110],"precision)":[111],"order":[113],"assess":[115],"robustness":[119],"proposed":[122],"method":[125],"across":[126],"different":[127],"sets.":[129],"As":[130],"proof":[132],"principle,":[134],"applied":[136],"two":[141],"recent":[142],"ENCODE":[144],"datasets":[145],"STAT1":[147,152],"Pol-II":[149],"sites.":[151],"benchmarked":[154,175],"detection":[158],"using":[162],"available":[163,231],"position":[164],"weight":[165],"matrices.":[166],"Pol-II,":[167],"focus":[170],"paper,":[173],"17":[177],"algorithms":[178],"closely":[181],"related":[182],"well-studied":[184],"problem":[185],"site":[191],"(TSS)":[192],"prediction.":[193],"Our":[194],"also":[196],"demonstrate":[197],"feasibility":[199],"extension":[205],"with":[206],"encouraging":[207],"from":[209,221],"small":[211],"portion":[212],"annotated":[214],"remainder.":[218],"Availability:":[219],"Available":[220],"http://www.genomics.csse.unimelb.edu.au/gat.":[222],"Contact:":[223],"justin.bedo@nicta.com.au;":[224],"adam.kowalczyk@nicta.com.au":[225],"Supplementary":[226,228],"Information:":[227],"Bioinformatics":[233],"online.":[234]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2103609042","counts_by_year":[],"updated_date":"2024-12-23T07:47:41.324650","created_date":"2016-06-24"}