{"id":"https://openalex.org/W4387946871","doi":"https://doi.org/10.48550/arxiv.2310.14724","title":"A Survey on LLM-generated Text Detection: Necessity, Methods, and Future Directions","display_name":"A Survey on LLM-generated Text Detection: Necessity, Methods, and Future Directions","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4387946871","doi":"https://doi.org/10.48550/arxiv.2310.14724"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2310.14724","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2310.14724","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036827870","display_name":"Junchao Wu","orcid":"https://orcid.org/0000-0001-5044-3019"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Junchao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114139283","display_name":"Shu Yang","orcid":"https://orcid.org/0000-0001-9226-2945"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Shu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085246256","display_name":"Runzhe Zhan","orcid":"https://orcid.org/0000-0002-3175-6885"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhan, Runzhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100299978","display_name":"Yulin Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Yulin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101468579","display_name":"Derek F. Wong","orcid":"https://orcid.org/0000-0002-5307-7322"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wong, Derek F.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5025832925","display_name":"Lidia S. Chao","orcid":"https://orcid.org/0000-0001-6629-170X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chao, Lidia S.","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.999953,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9407,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.937,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5132499},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.5059108},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.47292334},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.42485213},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32335904},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2310.14724","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2310.14724","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2310.14724","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.75,"display_name":"Quality education","id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4297672492","https://openalex.org/W4246396837","https://openalex.org/W3191453585","https://openalex.org/W3176240006","https://openalex.org/W3126451824","https://openalex.org/W2748952813","https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W1561927205"],"abstract_inverted_index":{"The":[0,78,102,233],"powerful":[1],"ability":[2],"to":[3,39,46,57,83,146,194,209],"understand,":[4],"follow,":[5],"and":[6,30,63,69,127,141,159,179,213],"generate":[7],"complex":[8],"language":[9,13],"emerging":[10],"from":[11,72],"large":[12],"models":[14],"(LLMs)":[15],"makes":[16],"LLM-generated":[17,52,76,79,166,191,230],"text":[18,80,89,167,192,231],"flood":[19],"many":[20],"areas":[21],"of":[22,61,75,88,198,229],"our":[23],"daily":[24],"lives":[25],"at":[26],"an":[27,43,93],"incredible":[28],"speed":[29],"is":[31,42,55,96,208],"widely":[32],"accepted":[33],"by":[34,92,111],"humans.":[35],"As":[36],"LLMs":[37,62,124],"continue":[38],"expand,":[40],"there":[41],"imperative":[44],"need":[45,145],"develop":[47],"detectors":[48],"that":[49],"can":[50],"detect":[51],"text.":[53],"This":[54],"crucial":[56],"mitigate":[58],"potential":[59,177],"misuse":[60],"safeguard":[64],"realms":[65],"like":[66,174],"artistic":[67],"expression":[68],"social":[70],"networks":[71],"harmful":[73],"influence":[74],"content.":[77],"detection":[81,168,193],"aims":[82],"discern":[84],"if":[85],"a":[86,98,211,223],"piece":[87],"was":[90],"produced":[91],"LLM,":[94],"which":[95],"essentially":[97],"binary":[99],"classification":[100],"task.":[101],"detector":[103,148],"techniques":[104],"have":[105],"witnessed":[106],"notable":[107],"advancements":[108],"recently,":[109],"propelled":[110],"innovations":[112],"in":[113,138,190,226],"watermarking":[114],"techniques,":[115],"zero-shot":[116],"methods,":[117,120,123],"fine-turning":[118],"LMs":[119],"adversarial":[121],"learning":[122],"as":[125],"detectors,":[126],"human-assisted":[128],"methods.":[129],"In":[130],"this":[131,139,206],"survey,":[132],"we":[133,163,183],"collate":[134],"recent":[135],"research":[136,189],"breakthroughs":[137],"area":[140],"underscore":[142],"the":[143,196,227],"pressing":[144],"bolster":[147],"research.":[149],"We":[150],"also":[151,219],"delve":[152],"into":[153],"prevalent":[154],"datasets,":[155],"elucidating":[156],"their":[157],"limitations":[158],"developmental":[160],"requirements.":[161],"Furthermore,":[162],"analyze":[164],"various":[165],"paradigms,":[169],"shedding":[170],"light":[171],"on":[172],"challenges":[173],"out-of-distribution":[175],"problems,":[176],"attacks,":[178],"data":[180],"ambiguity.":[181],"Conclusively,":[182],"highlight":[184],"interesting":[185],"directions":[186],"for":[187,216],"future":[188],"advance":[195],"implementation":[197],"responsible":[199],"artificial":[200],"intelligence":[201],"(AI).":[202],"Our":[203],"aim":[204],"with":[205],"survey":[207],"provide":[210],"clear":[212],"comprehensive":[214],"introduction":[215],"newcomers":[217],"while":[218],"offering":[220],"seasoned":[221],"researchers":[222],"valuable":[224],"update":[225],"field":[228],"detection.":[232],"useful":[234],"resources":[235],"are":[236],"publicly":[237],"available":[238],"at:":[239],"https://github.com/NLP2CT/LLM-generated-Text-Detection.":[240]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4387946871","counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":2}],"updated_date":"2025-05-04T13:36:20.592711","created_date":"2023-10-26"}