{"id":"https://openalex.org/W2087093841","doi":"https://doi.org/10.1109/icmla.2011.71","title":"Frequent Substring-Based Sequence Classification with an Ensemble of Support Vector Machines Trained Using Reduced Amino Acid Alphabets","display_name":"Frequent Substring-Based Sequence Classification with an Ensemble of Support Vector Machines Trained Using Reduced Amino Acid Alphabets","publication_year":2011,"publication_date":"2011-12-01","ids":{"openalex":"https://openalex.org/W2087093841","doi":"https://doi.org/10.1109/icmla.2011.71","mag":"2087093841"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla.2011.71","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032293659","display_name":"Charith Chitraranjan","orcid":"https://orcid.org/0000-0003-3205-2211"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"C. D. Chitraranjan","raw_affiliation_strings":["North Dakota State Univ.#TAB#"],"affiliations":[{"raw_affiliation_string":"North Dakota State Univ.#TAB#","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082116090","display_name":"Loai Alnemer","orcid":"https://orcid.org/0000-0002-1208-9861"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"L. Alnemer","raw_affiliation_strings":["North Dakota State Univ.#TAB#"],"affiliations":[{"raw_affiliation_string":"North Dakota State Univ.#TAB#","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082969875","display_name":"Omar Al-Azzam","orcid":"https://orcid.org/0009-0000-4460-5608"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"O. Al-Azzam","raw_affiliation_strings":["North Dakota State Univ.#TAB#"],"affiliations":[{"raw_affiliation_string":"North Dakota State Univ.#TAB#","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091100480","display_name":"Saeed Salem","orcid":"https://orcid.org/0000-0001-6478-4674"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"S. Salem","raw_affiliation_strings":["North Dakota State Univ.#TAB#"],"affiliations":[{"raw_affiliation_string":"North Dakota State Univ.#TAB#","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041754762","display_name":"Anne Denton","orcid":"https://orcid.org/0000-0002-2135-9501"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. M. Denton","raw_affiliation_strings":["North Dakota State Univ.#TAB#"],"affiliations":[{"raw_affiliation_string":"North Dakota State Univ.#TAB#","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101668449","display_name":"Muhammad Javed Iqbal","orcid":"https://orcid.org/0000-0002-2035-4004"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M. J. Iqbal","raw_affiliation_strings":["North Dakota State Univ.#TAB#"],"affiliations":[{"raw_affiliation_string":"North Dakota State Univ.#TAB#","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031755661","display_name":"Shahryar F. Kianian","orcid":"https://orcid.org/0000-0003-4968-3140"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"funder","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"S. F. Kianian","raw_affiliation_strings":["Dept. of Plant Sci., North Dakota State Univ. Fargo, Fargo, ND, USA"],"affiliations":[{"raw_affiliation_string":"Dept. of Plant Sci., North Dakota State Univ. Fargo, Fargo, ND, USA","institution_ids":["https://openalex.org/I57328836"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.587,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":4,"citation_normalized_percentile":{"value":0.790733,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":78,"max":80},"biblio":{"volume":null,"issue":null,"first_page":"180","last_page":"185"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9984,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/substring","display_name":"Substring","score":0.8161131},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.5321184}],"concepts":[{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.81801486},{"id":"https://openalex.org/C182407805","wikidata":"https://www.wikidata.org/wiki/Q2626534","display_name":"Substring","level":3,"score":0.8161131},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6450845},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6414156},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.61351246},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.60614103},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.58399546},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.5321184},{"id":"https://openalex.org/C2986374874","wikidata":"https://www.wikidata.org/wiki/Q8054","display_name":"Protein function","level":3,"score":0.4420211},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.22596174},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.14389876},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.115749806},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.075713515},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla.2011.71","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality education","score":0.8,"id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":33,"referenced_works":["https://openalex.org/W1539117683","https://openalex.org/W1574862351","https://openalex.org/W193142705","https://openalex.org/W1973101413","https://openalex.org/W1973626596","https://openalex.org/W198434325","https://openalex.org/W1997102766","https://openalex.org/W1998300401","https://openalex.org/W1999766624","https://openalex.org/W2007425502","https://openalex.org/W2020816856","https://openalex.org/W2034271244","https://openalex.org/W2049877533","https://openalex.org/W2055043387","https://openalex.org/W2084959893","https://openalex.org/W2086173258","https://openalex.org/W2093519658","https://openalex.org/W2097892623","https://openalex.org/W2107856523","https://openalex.org/W2112865076","https://openalex.org/W2119027485","https://openalex.org/W2119290215","https://openalex.org/W2127941101","https://openalex.org/W2130253098","https://openalex.org/W2143210482","https://openalex.org/W2143507938","https://openalex.org/W2154202919","https://openalex.org/W2156909104","https://openalex.org/W2166962853","https://openalex.org/W26001942","https://openalex.org/W4231686096","https://openalex.org/W4236236547","https://openalex.org/W46826290"],"related_works":["https://openalex.org/W2935275081","https://openalex.org/W2159663778","https://openalex.org/W2135470984","https://openalex.org/W2096697992","https://openalex.org/W2092160131","https://openalex.org/W2082535576","https://openalex.org/W2065993463","https://openalex.org/W2017375993","https://openalex.org/W2015809665","https://openalex.org/W1568877569"],"abstract_inverted_index":{"We":[0,20,61],"propose":[1],"a":[2],"frequent":[3,94],"pattern-based":[4],"algorithm":[5,67],"for":[6,140],"predicting":[7],"functions":[8],"and":[9,51,72,80,111],"localizations":[10],"of":[11,29,59,65,132,142],"proteins":[12],"from":[13,43],"their":[14],"primary":[15],"structure":[16],"(amino":[17],"acid":[18],"sequence).":[19],"use":[21,131],"reduced":[22,133],"alphabets":[23,134],"that":[24,34,92,129],"capture":[25],"the":[26,44,63,93,107,116,121,130,143],"higher":[27],"rate":[28],"substitution":[30],"between":[31],"amino":[32],"acids":[33],"are":[35,41,85],"physiochemically":[36],"similar.":[37],"Frequent":[38],"sub":[39,95],"strings":[40],"mined":[42],"training":[45],"sequences,":[46],"transformed":[47],"into":[48],"different":[49],"alphabets,":[50],"used":[52],"as":[53,87],"features":[54],"to":[55],"train":[56],"an":[57],"ensemble":[58],"SVMs.":[60],"evaluate":[62],"performance":[64,101,138],"our":[66],"using":[68],"protein":[69,73,122],"sub-cellular":[70,108],"localization":[71,109],"function":[74,123],"datasets.":[75,124],"Pair-wise":[76],"sequence-alignment-based":[77],"nearest":[78,117],"neighbor":[79,118],"basic":[81],"SVM":[82,97],"k-gram":[83],"classifiers":[84,105],"included":[86],"comparison":[88],"algorithms.":[89],"Results":[90],"show":[91,128],"string-based":[96],"classifier":[98,119],"demonstrates":[99],"better":[100],"compared":[102],"with":[103,115],"other":[104],"on":[106,120],"datasets":[110],"it":[112],"performs":[113],"competitively":[114],"Our":[125],"results":[126],"also":[127],"provides":[135],"statistically":[136],"significant":[137],"improvements":[139],"half":[141],"classes":[144],"studied.":[145]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2087093841","counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-03-18T18:52:26.965018","created_date":"2016-06-24"}