{"id":"https://openalex.org/W2151595407","doi":"https://doi.org/10.4304/jcp.7.12.2913-2920","title":"An Improved Random Forest Classifier for Text Categorization","display_name":"An Improved Random Forest Classifier for Text Categorization","publication_year":2012,"publication_date":"2012-12-01","ids":{"openalex":"https://openalex.org/W2151595407","doi":"https://doi.org/10.4304/jcp.7.12.2913-2920","mag":"2151595407"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.4304/jcp.7.12.2913-2920","pdf_url":null,"source":{"id":"https://openalex.org/S77894049","display_name":"Journal of Computers","issn_l":"1796-203X","issn":["1796-203X"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318660","host_organization_name":"Academy Publisher","host_organization_lineage":["https://openalex.org/P4310318660"],"host_organization_lineage_names":["Academy Publisher"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053591377","display_name":"Baoxun Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baoxun Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075351142","display_name":"Guo Xiu-feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiufeng Guo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002523892","display_name":"Yunming Ye","orcid":"https://orcid.org/0000-0002-1807-8581"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yunming Ye","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5103340525","display_name":"Jiefeng Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiefeng Cheng","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.444,"has_fulltext":false,"cited_by_count":160,"citation_normalized_percentile":{"value":0.949002,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"7","issue":"12","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9893,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9887,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/text-categorization","display_name":"Text Categorization","score":0.494252}],"concepts":[{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.8347317},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.6469988},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.63388515},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5709136},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5187443},{"id":"https://openalex.org/C2986744138","wikidata":"https://www.wikidata.org/wiki/Q302088","display_name":"Text categorization","level":3,"score":0.494252},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43563586},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43023595}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.4304/jcp.7.12.2913-2920","pdf_url":null,"source":{"id":"https://openalex.org/S77894049","display_name":"Journal of Computers","issn_l":"1796-203X","issn":["1796-203X"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318660","host_organization_name":"Academy Publisher","host_organization_lineage":["https://openalex.org/P4310318660"],"host_organization_lineage_names":["Academy Publisher"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.72,"id":"https://metadata.un.org/sdg/15","display_name":"Life on land"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":18,"referenced_works":["https://openalex.org/W140312209","https://openalex.org/W1500332810","https://openalex.org/W1550206324","https://openalex.org/W1570448133","https://openalex.org/W1972640883","https://openalex.org/W1982589161","https://openalex.org/W2005422315","https://openalex.org/W2043175314","https://openalex.org/W2063198646","https://openalex.org/W2071664212","https://openalex.org/W2112076978","https://openalex.org/W2149684865","https://openalex.org/W2165888424","https://openalex.org/W2469781980","https://openalex.org/W2911964244","https://openalex.org/W2976840617","https://openalex.org/W385173559","https://openalex.org/W592246762"],"related_works":["https://openalex.org/W2889302474","https://openalex.org/W2390857744","https://openalex.org/W2390698788","https://openalex.org/W2383063829","https://openalex.org/W2360898036","https://openalex.org/W2138922887","https://openalex.org/W2133651098","https://openalex.org/W2125109223","https://openalex.org/W2082678934","https://openalex.org/W2035261173"],"abstract_inverted_index":{"This":[0,12],"paper":[1],"proposes":[2],"an":[3],"improved":[4,108],"random":[5,49,109],"forest":[6,50],"algorithm":[7,13],"for":[8,17,47,68],"classifying":[9],"text":[10,31,56,96,114],"data.":[11],"is":[14,30],"particularly":[15],"designed":[16],"analyzing":[18],"very":[19],"high":[20],"dimensional":[21],"data":[22,29,97],"with":[23,58,99],"multiple":[24],"classes":[25],"whose":[26],"well-known":[27],"representative":[28],"corpus.":[32],"A":[33],"novel":[34],"feature":[35,65],"weighting":[36,66],"method":[37,41,67,93],"and":[38,44,71,81],"tree":[39,72],"selection":[40,73],"are":[42],"developed":[43],"synergistically":[45],"served":[46],"making":[48],"framework":[51],"well":[52],"suited":[53],"to":[54],"categorize":[55],"documents":[57],"dozens":[59],"of":[60,119],"topics.":[61],"With":[62],"the":[63,91,112],"new":[64],"subspace":[69,79],"sampling":[70],"method,":[74],"we":[75],"can":[76],"effectively":[77],"reduce":[78],"size":[80],"improve":[82],"classification":[83,115,120],"performance":[84],"without":[85],"increasing":[86],"error":[87],"bound.":[88],"We":[89],"apply":[90],"proposed":[92],"on":[94],"six":[95],"sets":[98],"diverse":[100],"characteristics.":[101],"The":[102],"results":[103],"have":[104],"demonstrated":[105],"that":[106],"this":[107],"forests":[110],"outperformed":[111],"popular":[113],"methods":[116],"in":[117],"terms":[118],"performance.":[121]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2151595407","counts_by_year":[{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":17},{"year":2022,"cited_by_count":30},{"year":2021,"cited_by_count":28},{"year":2020,"cited_by_count":26},{"year":2019,"cited_by_count":19},{"year":2018,"cited_by_count":13},{"year":2017,"cited_by_count":9},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":2}],"updated_date":"2024-12-14T09:19:01.226544","created_date":"2016-06-24"}