{"id":"https://openalex.org/W2043797302","doi":"https://doi.org/10.1186/1471-2105-11-445","title":"Automatic detection of anchor points for multiple sequence alignment","display_name":"Automatic detection of anchor points for multiple sequence alignment","publication_year":2010,"publication_date":"2010-09-02","ids":{"openalex":"https://openalex.org/W2043797302","doi":"https://doi.org/10.1186/1471-2105-11-445","mag":"2043797302","pmid":"https://pubmed.ncbi.nlm.nih.gov/20813050","pmcid":"https://www.ncbi.nlm.nih.gov/pmc/articles/2942857"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-11-445","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-11-445","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-11-445","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041679690","display_name":"Florian Pitschi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210121447","display_name":"Center for Excellence in Molecular Cell Science","ror":"https://ror.org/02rrdvm96","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210121447"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Florian Pitschi","raw_affiliation_strings":["Partner Institute for Computational Biology, CAS-MPG, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Partner Institute for Computational Biology, CAS-MPG, Shanghai, China","institution_ids":["https://openalex.org/I4210121447"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022701865","display_name":"Claudine Devauchelle","orcid":null},"institutions":[{"id":"https://openalex.org/I88467170","display_name":"Universit\u00e9 d'\u00c9vry Val-d'Essonne","ror":"https://ror.org/00e96v939","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954","https://openalex.org/I88467170"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Claudine Devauchelle","raw_affiliation_strings":["Laboratoire Statistique et G\u00e9nome (LSG), CNRS UMR 8071, INRA 1152, Universit\u00e9 d'Evry, Evry Cedex, France"],"affiliations":[{"raw_affiliation_string":"Laboratoire Statistique et G\u00e9nome (LSG), CNRS UMR 8071, INRA 1152, Universit\u00e9 d'Evry, Evry Cedex, France","institution_ids":["https://openalex.org/I88467170","https://openalex.org/I1294671590"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033278582","display_name":"Eduardo Corel","orcid":"https://orcid.org/0000-0003-4410-9035"},"institutions":[{"id":"https://openalex.org/I74656192","display_name":"University of G\u00f6ttingen","ror":"https://ror.org/01y9bpm73","country_code":"DE","type":"funder","lineage":["https://openalex.org/I74656192"]},{"id":"https://openalex.org/I88467170","display_name":"Universit\u00e9 d'\u00c9vry Val-d'Essonne","ror":"https://ror.org/00e96v939","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954","https://openalex.org/I88467170"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]}],"countries":["DE","FR"],"is_corresponding":false,"raw_author_name":"Eduardo Corel","raw_affiliation_strings":["Georg-August-Universit\u00e4t, Institut f\u00fcr Mikrobiologie und Genetik, G\u00f6ttingen, Germany","Laboratoire Statistique et G\u00e9nome (LSG), CNRS UMR 8071, INRA 1152, Universit\u00e9 d'Evry, Evry Cedex, France"],"affiliations":[{"raw_affiliation_string":"Georg-August-Universit\u00e4t, Institut f\u00fcr Mikrobiologie und Genetik, G\u00f6ttingen, Germany","institution_ids":["https://openalex.org/I74656192"]},{"raw_affiliation_string":"Laboratoire Statistique et G\u00e9nome (LSG), CNRS UMR 8071, INRA 1152, Universit\u00e9 d'Evry, Evry Cedex, France","institution_ids":["https://openalex.org/I88467170","https://openalex.org/I1294671590"]}]}],"institution_assertions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":0.4,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":8,"citation_normalized_percentile":{"value":0.610922,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":83,"max":84},"biblio":{"volume":"11","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9962,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9933,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multiple-sequence-alignment","display_name":"Multiple sequence alignment","score":0.80096734},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7756289},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5505892},{"id":"https://openalex.org/keywords/alignment-free-sequence-analysis","display_name":"Alignment-free sequence analysis","score":0.49954867},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4954492},{"id":"https://openalex.org/keywords/smith\u2013waterman-algorithm","display_name":"Smith\u2013Waterman algorithm","score":0.44309276},{"id":"https://openalex.org/keywords/structural-alignment","display_name":"Structural alignment","score":0.44143716},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4180606}],"concepts":[{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.80096734},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7756289},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.76151425},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7355283},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.55248404},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5505892},{"id":"https://openalex.org/C180384323","wikidata":"https://www.wikidata.org/wiki/Q16335137","display_name":"Alignment-free sequence analysis","level":5,"score":0.49954867},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4954492},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48022395},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.46663982},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4553145},{"id":"https://openalex.org/C72802188","wikidata":"https://www.wikidata.org/wiki/Q1683352","display_name":"Smith\u2013Waterman algorithm","level":5,"score":0.44309276},{"id":"https://openalex.org/C4668613","wikidata":"https://www.wikidata.org/wiki/Q4116110","display_name":"Structural alignment","level":5,"score":0.44143716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43349263},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4303699},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4180606},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.34268582},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.27932313},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.19039467},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07595652},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017422","descriptor_name":"Sequence Analysis, DNA","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017422","descriptor_name":"Sequence Analysis, DNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-11-445","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-11-445","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2942857","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/20813050","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-11-445","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-11-445","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.43}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":25,"referenced_works":["https://openalex.org/W1592870802","https://openalex.org/W1991330646","https://openalex.org/W2033339460","https://openalex.org/W2052831012","https://openalex.org/W2056176729","https://openalex.org/W2091134657","https://openalex.org/W2107248520","https://openalex.org/W2108187446","https://openalex.org/W2113213844","https://openalex.org/W2121669452","https://openalex.org/W2127774996","https://openalex.org/W2128442209","https://openalex.org/W2132926880","https://openalex.org/W2133783550","https://openalex.org/W2136570298","https://openalex.org/W2137015675","https://openalex.org/W2140292630","https://openalex.org/W2143357251","https://openalex.org/W2143796933","https://openalex.org/W2144362290","https://openalex.org/W2147996827","https://openalex.org/W2152688507","https://openalex.org/W2510854709","https://openalex.org/W3098719287","https://openalex.org/W3150974748"],"related_works":["https://openalex.org/W2948014085","https://openalex.org/W2762798190","https://openalex.org/W2759306076","https://openalex.org/W2501018882","https://openalex.org/W2351540725","https://openalex.org/W2158700816","https://openalex.org/W2145549598","https://openalex.org/W2051969447","https://openalex.org/W2043797302","https://openalex.org/W187239587"],"abstract_inverted_index":{"Abstract":[0],"Background":[1],"Determining":[2],"beforehand":[3],"specific":[4],"positions":[5,87,113,132],"to":[6,31,48,78,103,128],"align":[7],"(":[8],"anchor":[9,195],"points":[10],")":[11],"has":[12],"proved":[13],"valuable":[14],"for":[15,149],"the":[16,66,89,106,134,150,171,178,187,199,201,204,208],"accuracy":[17,202],"of":[18,68,86,94,108,112,173,189,203],"automated":[19],"multiple":[20,59,80,142],"sequence":[21],"alignment":[22,192],"(MSA)":[23],"software.":[24],"This":[25],"feature":[26],"can":[27,62,146],"be":[28,46,49,147],"used":[29],"manually":[30],"include":[32],"biological":[33],"expertise,":[34],"or":[35],"automatically,":[36],"usually":[37],"by":[38,156],"pairwise":[39],"similarity":[40],"searches.":[41],"Multiple":[42],"local":[43,60,81],"similarities":[44,61],"are":[45,138],"expected":[47],"more":[50,53],"adequate,":[51],"as":[52,153,194],"biologically":[54],"relevant.":[55],"However,":[56],"even":[57],"good":[58],"prove":[63],"incompatible":[64],"with":[65,105,140],"ordering":[67],"an":[69,120],"alignment.":[70,121,143],"Results":[71],"We":[72,122,167,184],"use":[73],"a":[74,125,141,157],"recently":[75],"developed":[76],"algorithm":[77,127],"detect":[79,129],"similarities,":[82],"which":[83],"returns":[84],"subsets":[85,111],"in":[88,119,133],"sequences":[90],"sharing":[91],"similar":[92],"contexts":[93],"appearence.":[95],"In":[96],"this":[97,109],"paper,":[98],"we":[99],"describe":[100],"first":[101],"how":[102],"get,":[104],"help":[107],"method,":[110],"that":[114,137,186],"could":[115],"form":[116],"partial":[117,135,191],"columns":[118,136,145,176],"introduce":[123],"next":[124],"graph-theoretic":[126],"(and":[130],"remove)":[131],"inconsistent":[139],"Partial":[144],"used,":[148],"time":[151],"being,":[152],"guide":[154],"only":[155],"few":[158],"MSA":[159],"programs:":[160],"ClustalW":[161,206],"2.0,":[162],"DIALIGN":[163],"2":[164],"and":[165],"T-Coffee.":[166],"perform":[168],"tests":[169],"on":[170,177,198,207],"effect":[172],"introducing":[174],"these":[175],"popular":[179],"benchmark":[180,209],"BAliBASE":[181,210],"3.":[182,211],"Conclusions":[183],"show":[185],"inclusion":[188],"our":[190],"columns,":[193],"points,":[196],"improve":[197],"whole":[200],"aligner":[205]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2043797302","counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-03-21T00:38:55.647258","created_date":"2016-06-24"}