{"id":"https://openalex.org/W4406022780","doi":"https://doi.org/10.48550/arxiv.2408.07852","title":"Training Language Models on the Knowledge Graph: Insights on\n Hallucinations and Their Detectability","display_name":"Training Language Models on the Knowledge Graph: Insights on\n Hallucinations and Their Detectability","publication_year":2024,"publication_date":"2024-08-14","ids":{"openalex":"https://openalex.org/W4406022780","doi":"https://doi.org/10.48550/arxiv.2408.07852"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.07852","pdf_url":"http://arxiv.org/pdf/2408.07852","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2408.07852","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081096634","display_name":"Jiri Hron","orcid":"https://orcid.org/0009-0001-3456-7588"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hron, Jiri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108136269","display_name":"Laura Culp","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Culp, Laura","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043002930","display_name":"Gamaleldin F. Elsayed","orcid":"https://orcid.org/0000-0002-4676-4220"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elsayed, Gamaleldin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022287663","display_name":"Rosanne Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Rosanne","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048167471","display_name":"Ben Adlam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Adlam, Ben","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076745446","display_name":"Maxwell L. Bileschi","orcid":"https://orcid.org/0000-0001-6771-0590"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bileschi, Maxwell","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066427994","display_name":"Bernd Bohnet","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bohnet, Bernd","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093272099","display_name":"JD Co-Reyes","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Co-Reyes, JD","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087591662","display_name":"Noah Fiedel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fiedel, Noah","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012702521","display_name":"C. Daniel Freeman","orcid":"https://orcid.org/0000-0003-2258-2905"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Freeman, C. Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048764935","display_name":"\u0130zzeddin G\u00fcr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gur, Izzeddin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009962014","display_name":"Kathleen Kenealy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kenealy, Kathleen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100420185","display_name":"Jaehoon Lee","orcid":"https://orcid.org/0000-0002-3131-5588"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Jaehoon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049860480","display_name":"Peter J. Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Peter J.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085443636","display_name":"Gaurav Mishra","orcid":"https://orcid.org/0000-0002-3254-8797"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mishra, Gaurav","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014193325","display_name":"Igor Mordatch","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mordatch, Igor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053888839","display_name":"Azade Nova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nova, Azade","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059899470","display_name":"Roman Novak","orcid":"https://orcid.org/0000-0001-5757-6703"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Novak, Roman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113069812","display_name":"Aaron Parisi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parisi, Aaron","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010225522","display_name":"Jeffrey Pennington","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pennington, Jeffrey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093272100","display_name":"Alex Rizkowsky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rizkowsky, Alex","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082545089","display_name":"Isabelle Simpson","orcid":"https://orcid.org/0000-0001-5654-0792"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Simpson, Isabelle","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045805879","display_name":"Hanie Sedghi","orcid":"https://orcid.org/0000-0002-7163-5009"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sedghi, Hanie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064986566","display_name":"Jascha Sohl\u2010Dickstein","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sohl-dickstein, Jascha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026208886","display_name":"Kevin Swersky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Swersky, Kevin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045680105","display_name":"Sharad Vikram","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vikram, Sharad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093219820","display_name":"Tris Warkentin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Warkentin, Tris","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113791670","display_name":"Lechao Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Lechao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060717631","display_name":"Kelvin Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Kelvin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112347601","display_name":"Jasper Snoek","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Snoek, Jasper","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5042760897","display_name":"Simon Kornblith","orcid":"https://orcid.org/0000-0002-9088-2443"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kornblith, Simon","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9257,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9257,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.5341465}],"concepts":[{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.5341465},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.517213},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.48535338},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4585734},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38002416},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34541053},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.34367275},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.19805944}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.07852","pdf_url":"http://arxiv.org/pdf/2408.07852","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.07852","pdf_url":"http://arxiv.org/pdf/2408.07852","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4387849428","https://openalex.org/W4376623224","https://openalex.org/W4312825515","https://openalex.org/W4306742369","https://openalex.org/W4303457083","https://openalex.org/W3204019825","https://openalex.org/W3188962172","https://openalex.org/W2951359407","https://openalex.org/W2772917594","https://openalex.org/W2131146434"],"abstract_inverted_index":{"While":[0,133],"many":[1,26],"capabilities":[2],"of":[3,14,74,95,102,110,152,158],"language":[4],"models":[5],"(LMs)":[6],"improve":[7],"with":[8],"increased":[9],"training":[10,51,57,97],"budget,":[11],"the":[12,50,56,96,150,153,156],"influence":[13],"scale":[15,151],"on":[16,38,93,131,140],"hallucinations":[17,42],"is":[18,30],"not":[19],"yet":[20],"fully":[21,54],"understood.":[22],"Hallucinations":[23],"come":[24],"in":[25,49],"forms,":[27],"and":[28,67,86,106,155],"there":[29],"no":[31],"universally":[32],"accepted":[33],"definition.":[34],"We":[35,78],"thus":[36,107],"focus":[37],"studying":[39],"only":[40],"those":[41],"where":[43],"a":[44,62,72,82],"correct":[45],"answer":[46],"appears":[47],"verbatim":[48],"set.":[52],"To":[53],"control":[55],"data":[58,98],"content,":[59],"we":[60,125,134,144],"construct":[61],"knowledge":[63],"graph":[64],"(KG)-based":[65],"dataset,":[66,84],"use":[68],"it":[69],"to":[70],"train":[71],"set":[73],"increasingly":[75],"large":[76],"LMs.":[77],"find":[79,145],"that":[80],"for":[81],"fixed":[83,141],"larger":[85,104],"longer-trained":[87],"LMs":[88],"hallucinate":[89],"less.":[90],"However,":[91],"hallucinating":[92],"$\\leq5$%":[94],"requires":[99],"an":[100,108,146],"order":[101,109],"magnitude":[103,111],"model,":[105],"more":[112],"compute,":[113],"than":[114],"Hoffmann":[115],"et":[116],"al.":[117],"(2022)":[118],"reported":[119],"was":[120],"optimal.":[121],"Given":[122],"this":[123],"costliness,":[124],"study":[126],"how":[127],"hallucination":[128],"detectors":[129],"depend":[130],"scale.":[132],"see":[135],"detector":[136],"size":[137],"improves":[138],"performance":[139],"LM's":[142],"outputs,":[143],"inverse":[147],"relationship":[148],"between":[149],"LM":[154],"detectability":[157],"its":[159],"hallucinations.":[160]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4406022780","counts_by_year":[],"updated_date":"2025-04-18T04:24:42.105395","created_date":"2025-01-03"}