{"id":"https://openalex.org/W4394906915","doi":"https://doi.org/10.48550/arxiv.2404.09836","title":"How Far Have We Gone in Stripped Binary Code Understanding Using Large\n Language Models","display_name":"How Far Have We Gone in Stripped Binary Code Understanding Using Large\n Language Models","publication_year":2024,"publication_date":"2024-04-15","ids":{"openalex":"https://openalex.org/W4394906915","doi":"https://doi.org/10.48550/arxiv.2404.09836"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.09836","pdf_url":"http://arxiv.org/pdf/2404.09836","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2404.09836","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038253295","display_name":"Xiuwei Shang","orcid":"https://orcid.org/0009-0009-6660-9947"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shang, Xiuwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085001934","display_name":"Shaoyin Cheng","orcid":"https://orcid.org/0000-0002-3992-9509"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Shaoyin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050913370","display_name":"G. Chen","orcid":"https://orcid.org/0000-0001-8555-9935"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Guoqiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050572140","display_name":"Yanming Zhang","orcid":"https://orcid.org/0000-0001-6138-6080"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yanming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103452489","display_name":"Li Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113033524","display_name":"Xiao Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Xiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101338646","display_name":"Gangyang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Gangyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067689180","display_name":"Weiming Zhang","orcid":"https://orcid.org/0000-0001-5576-6108"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Weiming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5064573190","display_name":"Nenghai Yu","orcid":"https://orcid.org/0000-0003-4417-9316"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Nenghai","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9892,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9892,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9462,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9399,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6057432}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6310629},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6057432},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.58787745},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5024977},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.17158979},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15060663},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.08622268}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.09836","pdf_url":"http://arxiv.org/pdf/2404.09836","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.09836","pdf_url":"http://arxiv.org/pdf/2404.09836","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391913857","https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2530322880","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Binary":[0],"code":[1,30,80,100,115,141,150,179,190,207],"analysis":[2],"plays":[3],"a":[4,122,181],"pivotal":[5],"role":[6],"in":[7,52,75,113,130,201],"various":[8],"software":[9,14,18],"security":[10],"applications,":[11],"such":[12,98],"as":[13,99],"maintenance,":[15],"malware":[16],"detection,":[17],"vulnerability":[19],"discovery,":[20],"patch":[21],"analysis,":[22],"etc.":[23],"However,":[24],"unlike":[25],"source":[26],"code,":[27],"understanding":[28,101,142],"binary":[29,54,79,114,140,149,178,189,206],"is":[31],"challenging":[32],"for":[33,96],"reverse":[34,132],"engineers":[35],"due":[36],"to":[37,48,78,124,180],"the":[38,93,109,126,186,195,199,203],"absence":[39],"of":[40,61,111,128,164,188,198,205],"semantic":[41],"information.":[42],"Therefore,":[43],"automated":[44],"tools":[45],"are":[46],"needed":[47],"assist":[49],"human":[50],"players":[51],"interpreting":[53],"code.":[55],"In":[56,117],"recent":[57],"years,":[58],"two":[59,138],"groups":[60],"technologies":[62,70],"have":[63,71,88],"shown":[64],"promising":[65],"prospects:":[66],"(1)":[67],"Deep":[68],"learning-based":[69],"demonstrated":[72],"competitive":[73],"results":[74,193],"tasks":[76,97],"related":[77],"understanding,":[81],"furthermore,":[82],"(2)":[83],"Large":[84],"Language":[85],"Models":[86],"(LLMs)":[87],"been":[89],"extensively":[90],"pre-trained":[91],"at":[92],"source-code":[94],"level":[95],"and":[102,148,159],"generation.":[103],"This":[104],"makes":[105],"participants":[106],"wonder":[107],"about":[108],"ability":[110],"LLMs":[112,129,166,175,200],"understanding.":[116,208],"this":[118],"work,":[119],"we":[120],"propose":[121],"benchmark":[123,136],"evaluate":[125],"effectiveness":[127],"real-world":[131],"engineering":[133],"scenarios.":[134],"The":[135],"covers":[137],"key":[139],"tasks,":[143],"including":[144],"function":[145],"name":[146],"recovery":[147],"summarization.":[151],"We":[152],"gain":[153],"valuable":[154],"insights":[155],"into":[156],"their":[157],"capabilities":[158],"limitations":[160],"through":[161],"extensive":[162],"evaluations":[163,171],"popular":[165],"using":[167],"our":[168],"benchmark.":[169],"Our":[170,192],"reveal":[172],"that":[173],"existing":[174],"can":[176],"understand":[177],"certain":[182],"extent,":[183],"thereby":[184],"improving":[185],"efficiency":[187],"analysis.":[191],"highlight":[194],"great":[196],"potential":[197],"advancing":[202],"field":[204]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4394906915","counts_by_year":[],"updated_date":"2025-04-20T00:31:16.660095","created_date":"2024-04-18"}