{"id":"https://openalex.org/W4380302022","doi":"https://doi.org/10.1609/icwsm.v17i1.22204","title":"Towards Generalization of Machine Learning Models: A Case Study of Arabic Sentiment Analysis","display_name":"Towards Generalization of Machine Learning Models: A Case Study of Arabic Sentiment Analysis","publication_year":2023,"publication_date":"2023-06-02","ids":{"openalex":"https://openalex.org/W4380302022","doi":"https://doi.org/10.1609/icwsm.v17i1.22204"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1609/icwsm.v17i1.22204","pdf_url":null,"source":{"id":"https://openalex.org/S4387284482","display_name":"Proceedings of the International AAAI Conference on Web and Social Media","issn_l":"2162-3449","issn":["2162-3449","2334-0770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":"https://doi.org/10.1609/icwsm.v17i1.22204","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029823776","display_name":"Samir Abdaljalil","orcid":"https://orcid.org/0009-0009-2183-6193"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Samir Abdaljalil","raw_affiliation_strings":["Qatar Computing Research Institute, Hamad Bin Khalifa University, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute, Hamad Bin Khalifa University, Doha, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092142310","display_name":"Shaimaa Hassanein","orcid":null},"institutions":[{"id":"https://openalex.org/I4210150948","display_name":"Zewail City of Science and Technology","ror":"https://ror.org/04w5f4y88","country_code":"EG","type":"education","lineage":["https://openalex.org/I4210150948"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Shaimaa Hassanein","raw_affiliation_strings":["Zewail City of Science and Technology, Giza, Egypt"],"affiliations":[{"raw_affiliation_string":"Zewail City of Science and Technology, Giza, Egypt","institution_ids":["https://openalex.org/I4210150948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102924560","display_name":"Hamdy Mubarak","orcid":"https://orcid.org/0000-0002-9051-6240"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Hamdy Mubarak","raw_affiliation_strings":["Qatar Computing Research Institute, Hamad Bin Khalifa University, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute, Hamad Bin Khalifa University, Doha, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047182137","display_name":"Ahmed Abdelal\u00ed","orcid":"https://orcid.org/0000-0002-4160-8181"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Ahmed Abdelali","raw_affiliation_strings":["Qatar Computing Research Institute, Hamad Bin Khalifa University, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute, Hamad Bin Khalifa University, Doha, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.352,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":1,"citation_normalized_percentile":{"value":0.606989,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":68,"max":79},"biblio":{"volume":"17","issue":null,"first_page":"971","last_page":"980"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.995,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment Analysis","score":0.6824646},{"id":"https://openalex.org/keywords/modern-standard-arabic","display_name":"Modern Standard Arabic","score":0.5896222},{"id":"https://openalex.org/keywords/emoji","display_name":"Emoji","score":0.47047883}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.76093423},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.70473295},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.6824646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6388969},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.6171756},{"id":"https://openalex.org/C2778243841","wikidata":"https://www.wikidata.org/wiki/Q56467","display_name":"Modern Standard Arabic","level":3,"score":0.5896222},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.5765343},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.55593723},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.5479139},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5426186},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5296623},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.52473813},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.47134134},{"id":"https://openalex.org/C2779247141","wikidata":"https://www.wikidata.org/wiki/Q1049294","display_name":"Emoji","level":3,"score":0.47047883},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.12837854},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12167594},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.12155524},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1609/icwsm.v17i1.22204","pdf_url":null,"source":{"id":"https://openalex.org/S4387284482","display_name":"Proceedings of the International AAAI Conference on Web and Social Media","issn_l":"2162-3449","issn":["2162-3449","2334-0770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1609/icwsm.v17i1.22204","pdf_url":null,"source":{"id":"https://openalex.org/S4387284482","display_name":"Proceedings of the International AAAI Conference on Web and Social Media","issn_l":"2162-3449","issn":["2162-3449","2334-0770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":31,"referenced_works":["https://openalex.org/W1933546049","https://openalex.org/W2043287290","https://openalex.org/W2250594687","https://openalex.org/W2464521204","https://openalex.org/W2516105622","https://openalex.org/W2594612414","https://openalex.org/W2751156688","https://openalex.org/W2766332866","https://openalex.org/W2890931798","https://openalex.org/W2901858379","https://openalex.org/W2901922204","https://openalex.org/W2902255491","https://openalex.org/W2944430231","https://openalex.org/W2964260444","https://openalex.org/W2970515934","https://openalex.org/W2982446111","https://openalex.org/W3003508021","https://openalex.org/W3003675680","https://openalex.org/W3016055861","https://openalex.org/W3037943408","https://openalex.org/W3088315964","https://openalex.org/W3098239359","https://openalex.org/W3103646405","https://openalex.org/W3155658398","https://openalex.org/W3199361187","https://openalex.org/W3207671820","https://openalex.org/W38739846","https://openalex.org/W4200310290","https://openalex.org/W4287862831","https://openalex.org/W4386506836","https://openalex.org/W4398301389"],"related_works":["https://openalex.org/W4362496363","https://openalex.org/W4200238620","https://openalex.org/W3205826705","https://openalex.org/W3119550360","https://openalex.org/W2975174210","https://openalex.org/W2903394456","https://openalex.org/W2902285665","https://openalex.org/W2888662092","https://openalex.org/W2770617756","https://openalex.org/W2244029015"],"abstract_inverted_index":{"The":[0],"abundance":[1],"of":[2,38,53,96,111,145,160,193,233,240],"social":[3],"media":[4],"data":[5,23,99,227],"in":[6,75,84,100,149,261],"the":[7,51,85,94,143,179,209,217,220,225],"Arab":[8],"world,":[9],"specifically":[10],"on":[11,120,208,247,264],"Twitter,":[12],"enabled":[13],"companies":[14],"and":[15,21,28,36,98,113,153,165,201,219,235,237,242],"entities":[16],"to":[17,30,59,104,125,169,270],"exploit":[18],"such":[19],"rich":[20],"beneficial":[22],"that":[24,56,117,141,178,197,203],"could":[25],"be":[26,170],"mined":[27],"used":[29,171],"extract":[31],"important":[32],"information,":[33],"including":[34],"sentiments":[35],"opinions":[37],"people":[39],"towards":[40],"a":[41,44,109,155,186,190],"topic":[42],"or":[43],"merchandise.":[45],"However,":[46],"with":[47,102,131],"this":[48,90],"plenitude":[49],"comes":[50],"issue":[52],"producing":[54],"models":[55,97,116,148,222,254],"are":[57,118],"able":[58],"deliver":[60],"consistent":[61,181],"outcomes":[62],"when":[63,129,245],"tested":[64,119],"within":[65],"various":[66],"contexts.":[67],"Although":[68],"model":[69,182,272],"generalization":[70,95,144,273],"has":[71,79],"been":[72,81],"thoroughly":[73],"investigated":[74,83],"many":[76],"fields,":[77],"it":[78],"not":[80],"heavily":[82],"Arabic":[86,101,150,163,210],"context.":[87],"To":[88],"address":[89],"gap,":[91],"we":[92,137,267],"investigate":[93],"application":[103],"sentiment":[105,151,168],"analysis,":[106,152],"by":[107,189,255],"performing":[108],"battery":[110],"experiments":[112,176],"building":[114],"different":[115,139],"five":[121,248],"independent":[122],"test":[123,250],"sets":[124],"understand":[126],"their":[127,166],"performance":[128],"presented":[130],"unseen":[132],"data.":[133],"In":[134],"doing":[135],"so,":[136],"detail":[138],"techniques":[140],"improve":[142,271],"machine":[146],"learning":[147],"share":[154,268],"large":[156],"versatile":[157],"dataset":[158,187],"consisting":[159],"approximately":[161],"1.64M":[162],"tweets":[164,200,206],"corresponding":[167],"for":[172,274],"future":[173],"research.":[174],"Our":[175],"concluded":[177],"most":[180],"is":[183],"trained":[184,223],"using":[185,224],"labelled":[188],"cascaded":[191],"approach":[192],"two":[194],"models,":[195],"one":[196],"labels":[198],"neutral":[199],"another":[202],"identifies":[204],"positive/negative":[205],"based":[207],"emoji":[211],"lexicon":[212],"after":[213],"class":[214],"balancing.":[215],"Both":[216],"BERT":[218],"SVM":[221],"refined":[226],"achieve":[228],"an":[229],"average":[230],"F-1":[231],"score":[232],"0.62":[234],"0.60,":[236],"standard":[238],"deviation":[239],"0.06":[241],"0.04":[243],"respectively,":[244],"evaluated":[246],"diverse":[249],"sets,":[251],"outperforming":[252],"other":[253],"at":[256],"least":[257],"17%":[258],"relative":[259],"gain":[260],"F-1.":[262],"Based":[263],"our":[265],"experiments,":[266],"recommendations":[269],"classification":[275],"tasks.":[276]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4380302022","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2024-12-11T19:54:34.199907","created_date":"2023-06-13"}