{"id":"https://openalex.org/W4403159732","doi":"https://doi.org/10.48550/arxiv.2408.02946","title":"Scaling Laws for Data Poisoning in LLMs","display_name":"Scaling Laws for Data Poisoning in LLMs","publication_year":2024,"publication_date":"2024-08-06","ids":{"openalex":"https://openalex.org/W4403159732","doi":"https://doi.org/10.48550/arxiv.2408.02946"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.02946","pdf_url":"http://arxiv.org/pdf/2408.02946","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2408.02946","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111354805","display_name":"Dillon Bowen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bowen, Dillon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038871937","display_name":"Brendan Murphy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Murphy, Brendan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111354806","display_name":"Will Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Will","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107783894","display_name":"David Khachaturov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khachaturov, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067087948","display_name":"Adam Gleave","orcid":"https://orcid.org/0000-0002-3467-528X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gleave, Adam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5057950507","display_name":"Kellin Pelrine","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pelrine, Kellin","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.521,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.521,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.5171,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scaling-law","display_name":"Scaling law","score":0.47580844}],"concepts":[{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.499655},{"id":"https://openalex.org/C2988430800","wikidata":"https://www.wikidata.org/wiki/Q428971","display_name":"Scaling law","level":3,"score":0.47580844},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.38018304},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.30708706},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.121974766},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.02946","pdf_url":"http://arxiv.org/pdf/2408.02946","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.02946","pdf_url":"http://arxiv.org/pdf/2408.02946","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4298190863","https://openalex.org/W3104909087","https://openalex.org/W2952002823","https://openalex.org/W2597205018","https://openalex.org/W2554072523","https://openalex.org/W2518229301","https://openalex.org/W2512421151","https://openalex.org/W2117748264","https://openalex.org/W2013329450","https://openalex.org/W1671671741"],"abstract_inverted_index":{"Recent":[0],"work":[1],"shows":[2],"that":[3,127],"LLMs":[4,108,129,141],"are":[5,13,130],"vulnerable":[6],"to":[7,25,31,43,56,119],"data":[8,22,62,84,91,95,103,145,156],"poisoning,":[9],"in":[10,158],"which":[11,83,117],"they":[12],"trained":[14],"on":[15,105,114],"partially":[16],"corrupted":[17],"or":[18,70],"harmful":[19,34,134],"data.":[20],"Poisoned":[21],"is":[23,54,73],"hard":[24],"detect,":[26],"breaks":[27],"guardrails,":[28],"and":[29,33,45,49,93],"leads":[30],"undesirable":[32],"behavior.":[35],"Given":[36],"the":[37,59,100,150],"intense":[38],"efforts":[39],"by":[40,68,82],"leading":[41],"labs":[42],"train":[44],"deploy":[46],"increasingly":[47,131],"larger":[48,128,159],"more":[50,137],"capable":[51],"LLMs,":[52],"it":[53,72],"critical":[55],"ask":[57],"if":[58,71],"risk":[60],"of":[61,102,121],"poisoning":[63,85,104,157],"will":[64],"be":[65],"naturally":[66],"mitigated":[67],"scale,":[69],"an":[74],"increasing":[75],"threat.":[76],"We":[77,125],"consider":[78],"three":[79,115],"threat":[80,123],"models":[81],"can":[86],"occur:":[87],"malicious":[88],"fine-tuning,":[89],"imperfect":[90],"curation,":[92],"intentional":[94],"contamination.":[96],"Our":[97],"experiments":[98],"evaluate":[99],"effects":[101],"23":[106],"frontier":[107],"ranging":[109],"from":[110],"1.5-72":[111],"billion":[112],"parameters":[113],"datasets":[116],"speak":[118],"each":[120],"our":[122],"models.":[124],"find":[126],"vulnerable,":[132],"learning":[133],"behavior":[135],"significantly":[136],"quickly":[138],"than":[139],"smaller":[140],"with":[142],"even":[143],"minimal":[144],"poisoning.":[146],"These":[147],"results":[148],"underscore":[149],"need":[151],"for":[152],"robust":[153],"safeguards":[154],"against":[155],"LLMs.":[160]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4403159732","counts_by_year":[],"updated_date":"2025-04-03T23:46:41.548906","created_date":"2024-10-06"}