{"id":"https://openalex.org/W4285116762","doi":"https://doi.org/10.18653/v1/2022.acl-long.459","title":"SHIELD: Defending Textual Neural Networks against Multiple Black-Box Adversarial Attacks with Stochastic Multi-Expert Patcher","display_name":"SHIELD: Defending Textual Neural Networks against Multiple Black-Box Adversarial Attacks with Stochastic Multi-Expert Patcher","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4285116762","doi":"https://doi.org/10.18653/v1/2022.acl-long.459"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2022.acl-long.459","pdf_url":"https://aclanthology.org/2022.acl-long.459.pdf","source":{"id":"https://openalex.org/S4363608652","display_name":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://aclanthology.org/2022.acl-long.459.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039440984","display_name":"Thai Le","orcid":"https://orcid.org/0000-0001-9632-6870"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]},{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR","US"],"is_corresponding":false,"raw_author_name":"Thai Le","raw_affiliation_strings":["Noseong Park Yonsei University","Penn State University"],"affiliations":[{"raw_affiliation_string":"Penn State University","institution_ids":["https://openalex.org/I130769515","https://openalex.org/I130769515"]},{"raw_affiliation_string":"Noseong Park Yonsei University","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067253588","display_name":"Noseong Park","orcid":"https://orcid.org/0000-0002-1268-840X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Noseong Park","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100405086","display_name":"Dongwon Lee","orcid":"https://orcid.org/0000-0001-8371-7629"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]},{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR","US"],"is_corresponding":false,"raw_author_name":"Dongwon Lee","raw_affiliation_strings":["Noseong Park Yonsei University","Penn State University"],"affiliations":[{"raw_affiliation_string":"Penn State University","institution_ids":["https://openalex.org/I130769515","https://openalex.org/I130769515"]},{"raw_affiliation_string":"Noseong Park Yonsei University","institution_ids":["https://openalex.org/I193775966"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.606,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":11,"citation_normalized_percentile":{"value":0.999875,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":92,"max":93},"biblio":{"volume":null,"issue":null,"first_page":"6661","last_page":"6674"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9044,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/black-box","display_name":"Black box","score":0.56260014},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep Neural Networks","score":0.44902456}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7872948},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7004818},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.61723936},{"id":"https://openalex.org/C94966114","wikidata":"https://www.wikidata.org/wiki/Q29256","display_name":"Black box","level":2,"score":0.56260014},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.55783117},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5251895},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5232938},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.47709352},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.44902456},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3493927},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30646402},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09080675},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08043581},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2022.acl-long.459","pdf_url":"https://aclanthology.org/2022.acl-long.459.pdf","source":{"id":"https://openalex.org/S4363608652","display_name":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2011.08908","pdf_url":"https://arxiv.org/pdf/2011.08908","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2022.acl-long.459","pdf_url":"https://aclanthology.org/2022.acl-long.459.pdf","source":{"id":"https://openalex.org/S4363608652","display_name":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":59,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1832693441","https://openalex.org/W1902237438","https://openalex.org/W1924770834","https://openalex.org/W1945616565","https://openalex.org/W2115122836","https://openalex.org/W2133564696","https://openalex.org/W2180612164","https://openalex.org/W2250539671","https://openalex.org/W2547875792","https://openalex.org/W2560440203","https://openalex.org/W2595653137","https://openalex.org/W2765407302","https://openalex.org/W2766108848","https://openalex.org/W2785699986","https://openalex.org/W2794557536","https://openalex.org/W2799194071","https://openalex.org/W2896457183","https://openalex.org/W2911510572","https://openalex.org/W2912070915","https://openalex.org/W2926587947","https://openalex.org/W2947415936","https://openalex.org/W2949128310","https://openalex.org/W2951104886","https://openalex.org/W2952186591","https://openalex.org/W2962718684","https://openalex.org/W2962818281","https://openalex.org/W2963126845","https://openalex.org/W2963283805","https://openalex.org/W2963859254","https://openalex.org/W2965373594","https://openalex.org/W2965595599","https://openalex.org/W2970078867","https://openalex.org/W2971524212","https://openalex.org/W2972619028","https://openalex.org/W2976345833","https://openalex.org/W2982054702","https://openalex.org/W2997645422","https://openalex.org/W3034445277","https://openalex.org/W3035507081","https://openalex.org/W3035736465","https://openalex.org/W3084992427","https://openalex.org/W3096609285","https://openalex.org/W3099803414","https://openalex.org/W3101449015","https://openalex.org/W3104423855","https://openalex.org/W3105604018","https://openalex.org/W3120061794","https://openalex.org/W3127569499","https://openalex.org/W3155936402","https://openalex.org/W3169948074","https://openalex.org/W3173261519","https://openalex.org/W3173596483","https://openalex.org/W3175982906","https://openalex.org/W3176648901","https://openalex.org/W3177190797","https://openalex.org/W4288089799","https://openalex.org/W4288594304","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W4313346231","https://openalex.org/W4285785480","https://openalex.org/W3203790781","https://openalex.org/W3093978547","https://openalex.org/W3080754722","https://openalex.org/W3009622996","https://openalex.org/W2997056298","https://openalex.org/W2953536436","https://openalex.org/W2950183588","https://openalex.org/W2738001131"],"abstract_inverted_index":{"Even":[0],"though":[1],"several":[2],"methods":[3],"have":[4],"proposed":[5],"to":[6,35,69,120,209],"defend":[7,19],"textual":[8,89,177],"neural":[9],"network":[10],"(NN)":[11],"models":[12,30,50],"against":[13,20,193],"black-box":[14,113,196],"adversarial":[15,123],"attacks,":[16,197],"they":[17],"often":[18],"a":[21,36,75,88,100,146,154,184],"specific":[22],"text":[23],"perturbation":[24],"strategy":[25],"and/or":[26],"require":[27,54],"re-training":[28],"the":[29,47,84,97,127,139,150],"from":[31,64],"scratch.":[32],"This":[33],"leads":[34],"lack":[37],"of":[38,87,104,111,135,149,171,187],"generalization":[39],"in":[40,67,189],"practice":[41],"and":[42,57,81,91,95,175],"redundant":[43],"computation.":[44],"In":[45,141],"particular,":[46],"state-of-the-art":[48],"transformer":[49],"(e.g.,":[51],"BERT,":[52,174],"RoBERTa)":[53],"great":[55],"time":[56],"computation":[58],"resources.":[59],"By":[60,163],"borrowing":[61],"an":[62,161],"idea":[63],"software":[65],"engineering,":[66],"order":[68],"address":[70],"these":[71],"limitations,":[72],"we":[73,167],"propose":[74],"novel":[76],"algorithm,":[77],"SHIELD,":[78,182],"which":[79,152],"modifies":[80],"re-trains":[82],"only":[83],"last":[85],"layer":[86],"NN,":[90],"thus":[92],"it":[93],"\"patches\"":[94],"\"transforms\"":[96],"NN":[98,156],"into":[99],"stochastic":[101],"weighted":[102,133],"ensemble":[103],"multi-expert":[105],"prediction":[106],"heads.":[107],"Considering":[108],"that":[109,169],"most":[110],"current":[112],"attacks":[114],"rely":[115],"on":[116,138,191],"iterative":[117],"search":[118],"mechanisms":[119],"optimize":[121],"their":[122],"perturbations,":[124],"SHIELD":[125,144],"confuses":[126],"attackers":[128],"by":[129,181],"automatically":[130],"utilizing":[131],"different":[132,195],"ensembles":[134],"predictors":[136],"depending":[137],"input.":[140],"other":[142],"words,":[143],"breaks":[145],"fundamental":[147],"assumption":[148],"attack,":[151],"is":[153],"victim":[155],"model":[157],"remains":[158],"constant":[159],"during":[160],"attack.":[162],"conducting":[164],"comprehensive":[165],"experiments,":[166],"demonstrate":[168],"all":[170],"CNN,":[172],"RNN,":[173],"RoBERTa-based":[176],"NNs,":[178],"once":[179],"patched":[180],"exhibit":[183],"relative":[185],"enhancement":[186],"15%\u201370%":[188],"accuracy":[190],"average":[192],"14":[194],"outperforming":[198],"6":[199],"defensive":[200],"baselines":[201],"across":[202],"3":[203],"public":[204],"datasets.":[205],"All":[206],"codes":[207],"are":[208],"be":[210],"released.":[211]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4285116762","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1}],"updated_date":"2024-12-10T04:34:19.000219","created_date":"2022-07-14"}