{"id":"https://openalex.org/W4403746914","doi":"https://doi.org/10.48550/arxiv.2409.08240","title":"IFAdapter: Instance Feature Control for Grounded Text-to-Image\n Generation","display_name":"IFAdapter: Instance Feature Control for Grounded Text-to-Image\n Generation","publication_year":2024,"publication_date":"2024-09-12","ids":{"openalex":"https://openalex.org/W4403746914","doi":"https://doi.org/10.48550/arxiv.2409.08240"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.08240","pdf_url":"http://arxiv.org/pdf/2409.08240","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2409.08240","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054606413","display_name":"Yinwei Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yinwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039357854","display_name":"Xianpan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Xianpan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101733866","display_name":"Bing Ma","orcid":"https://orcid.org/0000-0003-0993-5403"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Bing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024940688","display_name":"Xuefeng Su","orcid":"https://orcid.org/0000-0002-8954-4412"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Xuefeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103172392","display_name":"Kai Ma","orcid":"https://orcid.org/0000-0003-1810-6658"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Kai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5015574447","display_name":"Xinchao Wang","orcid":"https://orcid.org/0000-0003-0057-1404"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xinchao","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":82},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9231,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9231,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9214,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6240725}],"concepts":[{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6240725},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5236435},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46886283},{"id":"https://openalex.org/C156325361","wikidata":"https://www.wikidata.org/wiki/Q1152864","display_name":"Grounded theory","level":3,"score":0.46821192},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.44297886},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4260639},{"id":"https://openalex.org/C190248442","wikidata":"https://www.wikidata.org/wiki/Q839486","display_name":"Qualitative research","level":2,"score":0.16681334},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.15076864},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.14524978},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.090826154},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.05049786}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.08240","pdf_url":"http://arxiv.org/pdf/2409.08240","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.08240","pdf_url":"http://arxiv.org/pdf/2409.08240","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4396854307","https://openalex.org/W4361008414","https://openalex.org/W3040823075","https://openalex.org/W2620765995","https://openalex.org/W2092147963","https://openalex.org/W2054080977","https://openalex.org/W2015439768","https://openalex.org/W1546533203","https://openalex.org/W1535784397","https://openalex.org/W1511554945"],"abstract_inverted_index":{"While":[0],"Text-to-Image":[1],"(T2I)":[2],"diffusion":[3,118],"models":[4,163],"excel":[5],"at":[6],"generating":[7,52],"visually":[8],"appealing":[9],"images":[10],"of":[11,24],"individual":[12],"instances,":[13],"they":[14],"struggle":[15],"to":[16,33,68,107,127,143,148],"accurately":[17],"position":[18],"and":[19,73,101,138,154,167],"control":[20,44],"the":[21,35,60,81,86,117],"features":[22,110],"generation":[23],"multiple":[25],"instances.":[26,78],"The":[27,91,114],"Layout-to-Image":[28],"(L2I)":[29],"task":[30],"was":[31],"introduced":[32],"address":[34,80],"positioning":[36,153],"challenges":[37],"by":[38,96],"incorporating":[39,97],"bounding":[40],"boxes":[41],"as":[42,120],"spatial":[43,112],"signals,":[45],"but":[46],"it":[47,125],"still":[48],"falls":[49],"short":[50],"in":[51,76,164],"precise":[53],"instance":[54],"features.":[55,155],"In":[56],"response,":[57],"we":[58,84,133],"propose":[59],"Instance":[61,87,104],"Feature":[62,88],"Generation":[63],"(IFG)":[64],"task,":[65,83],"which":[66],"aims":[67],"ensure":[69],"both":[70,165],"positional":[71],"accuracy":[72],"feature":[74,94],"fidelity":[75],"generated":[77],"To":[79],"IFG":[82,136],"introduce":[85],"Adapter":[89],"(IFAdapter).":[90],"IFAdapter":[92,115,160],"enhances":[93],"depiction":[95],"additional":[98],"appearance":[99],"tokens":[100],"utilizing":[102],"an":[103,135],"Semantic":[105],"Map":[106],"align":[108],"instance-level":[109],"with":[111,151],"locations.":[113],"guides":[116],"process":[119],"a":[121,140],"plug-and-play":[122],"module,":[123],"making":[124],"adaptable":[126],"various":[128],"community":[129],"models.":[130],"For":[131],"evaluation,":[132],"contribute":[134],"benchmark":[137],"develop":[139],"verification":[141],"pipeline":[142],"objectively":[144],"compare":[145],"models'":[146],"abilities":[147],"generate":[149],"instances":[150],"accurate":[152],"Experimental":[156],"results":[157],"demonstrate":[158],"that":[159],"outperforms":[161],"other":[162],"quantitative":[166],"qualitative":[168],"evaluations.":[169]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4403746914","counts_by_year":[],"updated_date":"2025-01-21T06:18:20.998816","created_date":"2024-10-25"}