{"id":"https://openalex.org/W4378499145","doi":"https://doi.org/10.48550/arxiv.2305.15717","title":"The False Promise of Imitating Proprietary LLMs","display_name":"The False Promise of Imitating Proprietary LLMs","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4378499145","doi":"https://doi.org/10.48550/arxiv.2305.15717"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.15717","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2305.15717","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092031203","display_name":"Arnav Gudibande","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gudibande, Arnav","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111226805","display_name":"Eric Wallace","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wallace, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052858739","display_name":"Charlie Snell","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Snell, Charlie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081645573","display_name":"Xinyang Geng","orcid":"https://orcid.org/0009-0000-5500-6387"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Geng, Xinyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100458789","display_name":"Hao Liu","orcid":"https://orcid.org/0000-0002-1975-1272"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049349154","display_name":"Pieter Abbeel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abbeel, Pieter","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026322200","display_name":"Sergey Levine","orcid":"https://orcid.org/0000-0001-6764-2743"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levine, Sergey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5019426968","display_name":"Dawn Song","orcid":"https://orcid.org/0000-0001-9745-6802"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Dawn","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.917444,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9903,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9662,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7086351},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.4470991}],"concepts":[{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.8736774},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7086351},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6901401},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.4470991},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42757738},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.15110019},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.15717","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.15717","pdf_url":"http://arxiv.org/pdf/2305.15717","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2305.15717","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.15717","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W2748952813","https://openalex.org/W1531601525"],"abstract_inverted_index":{"An":[0],"emerging":[1],"method":[2],"to":[3,11,35,135,144,238],"cheaply":[4,36],"improve":[5],"a":[6,17,22,43,58,188,193],"weaker":[7,44],"language":[8],"model":[9,68,185],"is":[10,187,237],"finetune":[12,57],"it":[13],"on":[14,146],"outputs":[15,116],"from":[16,140],"stronger":[18],"model,":[19],"such":[20],"as":[21,117],"proprietary":[23,39,255],"system":[24],"like":[25],"ChatGPT":[26,64,145],"(e.g.,":[27],"Alpaca,":[28],"Self-Instruct,":[29],"and":[30,73,87,111,199],"others).":[31],"This":[32],"approach":[33],"looks":[34],"imitate":[37,63],"the":[38,82,96,138,141,154,229,240,251],"model's":[40],"capabilities":[41,195],"using":[42,65,84,210,219],"open-source":[45,235],"model.":[46],"In":[47,224],"this":[48,53],"work,":[49],"we":[50,92,128,182,226],"critically":[51],"analyze":[52],"approach.":[54],"We":[55,79,157],"first":[56],"series":[59],"of":[60,99,137,214,243,253],"LMs":[61,201],"that":[62,130,148,159,184,228],"varying":[66],"base":[67,142,222,246],"sizes":[69],"(1.5B--13B),":[70],"data":[71,75,216],"sources,":[72],"imitation":[74,101,131,155,169,186,215],"amounts":[76],"(0.3M--150M":[77],"tokens).":[78],"then":[80],"evaluate":[81],"models":[83,102,132,170,236],"crowd":[85,112],"raters":[86,167],"canonical":[88],"NLP":[89],"benchmarks.":[90],"Initially,":[91],"were":[93],"surprised":[94],"by":[95,218],"output":[97],"quality":[98],"our":[100],"--":[103],"they":[104],"appear":[105],"far":[106],"better":[107,245],"at":[108,173],"following":[109],"instructions,":[110],"workers":[113],"rate":[114],"their":[115],"competitive":[118],"with":[119,203],"ChatGPT.":[120],"However,":[121],"when":[122],"conducting":[123],"more":[124,220],"targeted":[125],"automatic":[126],"evaluations,":[127],"find":[129],"close":[133],"little":[134],"none":[136],"gap":[139,196],"LM":[143],"tasks":[147],"are":[149,171],"not":[150,178],"heavily":[151],"supported":[152],"in":[153],"data.":[156],"show":[158],"these":[160],"performance":[161],"discrepancies":[162],"may":[163],"slip":[164],"past":[165],"human":[166],"because":[168],"adept":[172],"mimicking":[174],"ChatGPT's":[175],"style":[176],"but":[177],"its":[179],"factuality.":[180],"Overall,":[181],"conclude":[183],"false":[189],"promise:":[190],"there":[191],"exists":[192],"substantial":[194],"between":[197],"open":[198],"closed":[200],"that,":[202],"current":[204],"methods,":[205],"can":[206],"only":[207],"be":[208],"bridged":[209],"an":[211],"unwieldy":[212],"amount":[213],"or":[217],"capable":[221],"LMs.":[223],"turn,":[225],"argue":[227],"highest":[230],"leverage":[231],"action":[232],"for":[233],"improving":[234],"tackle":[239],"difficult":[241],"challenge":[242],"developing":[244],"LMs,":[247],"rather":[248],"than":[249],"taking":[250],"shortcut":[252],"imitating":[254],"systems.":[256]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4378499145","counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":26}],"updated_date":"2025-05-03T05:35:01.259532","created_date":"2023-05-27"}