{"id":"https://openalex.org/W4403749441","doi":"https://doi.org/10.48550/arxiv.2407.12019","title":"DIM: Dynamic Integration of Multimodal Entity Linking with Large\n Language Model","display_name":"DIM: Dynamic Integration of Multimodal Entity Linking with Large\n Language Model","publication_year":2024,"publication_date":"2024-06-27","ids":{"openalex":"https://openalex.org/W4403749441","doi":"https://doi.org/10.48550/arxiv.2407.12019"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.12019","pdf_url":"http://arxiv.org/pdf/2407.12019","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2407.12019","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010069764","display_name":"Shezheng Song","orcid":"https://orcid.org/0009-0007-9985-7619"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Shezheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023621058","display_name":"Shasha Li","orcid":"https://orcid.org/0000-0002-7581-1612"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shasha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100693464","display_name":"Jie Yu","orcid":"https://orcid.org/0000-0002-1649-4020"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Jie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089008240","display_name":"Shan Zhao","orcid":"https://orcid.org/0000-0003-4503-8259"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Shan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101984096","display_name":"Xiao Peng Li","orcid":"https://orcid.org/0000-0002-5448-7219"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xiaopeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020663450","display_name":"Jun Ma","orcid":"https://orcid.org/0000-0002-4195-7760"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100374791","display_name":"Xiaodong Liu","orcid":"https://orcid.org/0000-0002-6879-990X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaodong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100448048","display_name":"Zhuo Li","orcid":"https://orcid.org/0000-0003-4554-6018"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zhuo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5080183182","display_name":"Xiaoguang Mao","orcid":"https://orcid.org/0000-0003-4204-7424"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Xiaoguang","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9409,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9409,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5547454},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.46532485},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42024174},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.13074827}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.12019","pdf_url":"http://arxiv.org/pdf/2407.12019","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.12019","pdf_url":"http://arxiv.org/pdf/2407.12019","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4396701345","https://openalex.org/W4396696052","https://openalex.org/W4391913857","https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Our":[0],"study":[1],"delves":[2],"into":[3],"Multimodal":[4,55],"Entity":[5],"Linking,":[6],"aligning":[7],"the":[8,62,65,84,98,114,120,129],"mention":[9],"in":[10,15,83],"multimodal":[11],"information":[12,31,56,79],"with":[13,57,97],"entities":[14,44,82],"knowledge":[16,58],"base.":[17],"Existing":[18],"methods":[19,118],"are":[20,143],"still":[21],"facing":[22],"challenges":[23],"like":[24],"ambiguous":[25],"entity":[26,37,92,100],"representations":[27,101],"and":[28,45,94,124,140],"limited":[29],"image":[30],"utilization.":[32],"Thus,":[33],"we":[34],"propose":[35,50],"dynamic":[36,99],"extraction":[38,90],"using":[39],"ChatGPT,":[40],"which":[41,86],"dynamically":[42,130],"extracts":[43,78],"enhances":[46],"datasets.":[47],"We":[48],"also":[49],"a":[51],"method:":[52],"Dynamically":[53],"Integrate":[54],"base":[59],"(DIM),":[60],"employing":[61],"capability":[63],"of":[64,91,116],"Large":[66],"Language":[67],"Model":[68],"(LLM)":[69],"for":[70],"visual":[71],"understanding.":[72],"The":[73,105],"LLM,":[74],"such":[75],"as":[76],"BLIP-2,":[77],"relevant":[80],"to":[81],"image,":[85],"can":[87],"facilitate":[88],"improved":[89],"features":[93],"linking":[95],"them":[96],"provided":[102],"by":[103],"ChatGPT.":[104],"experiments":[106],"demonstrate":[107],"that":[108],"our":[109,138],"proposed":[110],"DIM":[111],"method":[112],"outperforms":[113],"majority":[115],"existing":[117],"on":[119,128,145],"three":[121],"original":[122],"datasets,":[123],"achieves":[125],"state-of-the-art":[126],"(SOTA)":[127],"enhanced":[131],"datasets":[132,142],"(Wiki+,":[133],"Rich+,":[134],"Diverse+).":[135],"For":[136],"reproducibility,":[137],"code":[139],"collected":[141],"released":[144],"\\url{https://github.com/season1blue/DIM}.":[146]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4403749441","counts_by_year":[],"updated_date":"2025-04-22T23:56:49.683135","created_date":"2024-10-25"}