{"id":"https://openalex.org/W4393939825","doi":"https://doi.org/10.48550/arxiv.2404.01959","title":"Bi-LORA: A Vision-Language Approach for Synthetic Image Detection","display_name":"Bi-LORA: A Vision-Language Approach for Synthetic Image Detection","publication_year":2024,"publication_date":"2024-04-02","ids":{"openalex":"https://openalex.org/W4393939825","doi":"https://doi.org/10.48550/arxiv.2404.01959"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.01959","pdf_url":"http://arxiv.org/pdf/2404.01959","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2404.01959","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031314564","display_name":"Mamadou Ke\u00efta","orcid":"https://orcid.org/0009-0009-7618-9253"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Keita, Mamadou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114039161","display_name":"Wassim Hamidouche","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hamidouche, Wassim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094583687","display_name":"Hessen Bougueffa Eutamene","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eutamene, Hessen Bougueffa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013928164","display_name":"Abdenour Hadid","orcid":"https://orcid.org/0000-0001-9092-735X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hadid, Abdenour","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5114889285","display_name":"Abdelmalik Taleb-Ahmed","orcid":"https://orcid.org/0000-0001-6034-7290"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taleb-Ahmed, Abdelmalik","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.915412,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":77,"max":88},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9007,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.60664386},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5367002},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5191821},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49187493}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.01959","pdf_url":"http://arxiv.org/pdf/2404.01959","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.01959","pdf_url":"http://arxiv.org/pdf/2404.01959","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3116076068","https://openalex.org/W2951359407","https://openalex.org/W2775347418","https://openalex.org/W2772917594","https://openalex.org/W2755342338","https://openalex.org/W2229312674","https://openalex.org/W2166024367","https://openalex.org/W2079911747","https://openalex.org/W2058170566","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Advancements":[0],"in":[1,18,43,106,147,179],"deep":[2],"image":[3,96,116,129,181],"synthesis":[4],"techniques,":[5,89],"such":[6],"as":[7,114],"generative":[8,155],"adversarial":[9],"networks":[10],"(GANs)":[11],"and":[12,62,133,163,189],"diffusion":[13],"models":[14,71,156,190],"(DMs),":[15],"have":[16],"ushered":[17],"an":[19,75,115,173],"era":[20],"of":[21,69,94,123,142,177],"generating":[22],"highly":[23],"realistic":[24],"images.":[25,101],"While":[26],"this":[27,193],"technological":[28],"progress":[29],"has":[30,35],"captured":[31],"significant":[32],"interest,":[33],"it":[34],"also":[36],"raised":[37],"concerns":[38],"about":[39],"the":[40,56,66,92,120,140],"potential":[41],"difficulty":[42],"distinguishing":[44],"real":[45],"images":[46,151],"from":[47,55,152],"their":[48],"synthetic":[49,95,180],"counterparts.":[50],"This":[51],"paper":[52],"takes":[53],"inspiration":[54],"potent":[57],"convergence":[58],"capabilities":[59,122,166],"between":[60],"vision":[61],"language,":[63],"coupled":[64],"with":[65,84,192],"zero-shot":[67],"nature":[68],"vision-language":[70],"(VLMs).":[72],"We":[73],"introduce":[74],"innovative":[76],"method":[77],"called":[78],"Bi-LORA":[79],"that":[80],"leverages":[81],"VLMs,":[82],"combined":[83],"low-rank":[85],"adaptation":[86],"(LORA)":[87],"tuning":[88],"to":[90,138,161,167],"enhance":[91],"precision":[93],"detection":[97,182],"for":[98],"unseen":[99,149,184],"model-generated":[100],"The":[102,169,187],"pivotal":[103],"conceptual":[104],"shift":[105],"our":[107,143],"methodology":[108],"revolves":[109],"around":[110],"reframing":[111],"binary":[112],"classification":[113],"captioning":[117],"task,":[118],"leveraging":[119],"distinctive":[121],"cutting-edge":[124],"VLM,":[125],"notably":[126],"bootstrapping":[127],"language":[128],"pre-training":[130],"(BLIP2).":[131],"Rigorous":[132],"comprehensive":[134],"experiments":[135],"are":[136],"conducted":[137],"validate":[139],"effectiveness":[141],"proposed":[144],"approach,":[145],"particularly":[146],"detecting":[148],"diffusion-generated":[150],"unknown":[153],"diffusion-based":[154],"during":[157],"training,":[158],"showcasing":[159],"robustness":[160],"noise,":[162],"demonstrating":[164],"generalization":[165],"GANs.":[168],"obtained":[170],"results":[171],"showcase":[172],"impressive":[174],"average":[175],"accuracy":[176],"93.41%":[178],"on":[183],"generation":[185],"models.":[186],"code":[188],"associated":[191],"research":[194],"can":[195],"be":[196],"publicly":[197],"accessed":[198],"at":[199],"https://github.com/Mamadou-Keita/VLM-DETECT.":[200]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4393939825","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-04-19T17:39:09.387069","created_date":"2024-04-05"}