{"id":"https://openalex.org/W4392539635","doi":"https://doi.org/10.48550/arxiv.2403.02626","title":"Modeling Collaborator: Enabling Subjective Vision Classification With\n Minimal Human Effort via LLM Tool-Use","display_name":"Modeling Collaborator: Enabling Subjective Vision Classification With\n Minimal Human Effort via LLM Tool-Use","publication_year":2024,"publication_date":"2024-03-04","ids":{"openalex":"https://openalex.org/W4392539635","doi":"https://doi.org/10.48550/arxiv.2403.02626"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2403.02626","pdf_url":"https://arxiv.org/pdf/2403.02626","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2403.02626","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006780186","display_name":"Imad Eddine Toubal","orcid":"https://orcid.org/0000-0003-1754-0823"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Toubal, Imad Eddine","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064895220","display_name":"Aditya Avinash","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Avinash, Aditya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063596836","display_name":"Neil Alldrin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alldrin, Neil Gordon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032570936","display_name":"Jan Dlabal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dlabal, Jan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058224708","display_name":"Wenlei Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Wenlei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009947623","display_name":"Enming Luo","orcid":"https://orcid.org/0000-0002-6887-1094"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Enming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080565982","display_name":"Otilia Stretcu","orcid":"https://orcid.org/0000-0001-7141-2916"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stretcu, Otilia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100604457","display_name":"Hao Xiong","orcid":"https://orcid.org/0000-0002-7619-4740"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024393012","display_name":"Chun-Ta Lu","orcid":"https://orcid.org/0000-0001-8573-4975"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Chun-Ta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056352820","display_name":"Howard Zhou","orcid":"https://orcid.org/0000-0003-3245-8481"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Howard","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032451496","display_name":"Ranjay Krishna","orcid":"https://orcid.org/0000-0001-8784-2531"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Krishna, Ranjay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017633018","display_name":"Ariel Fuxman","orcid":"https://orcid.org/0009-0003-6760-997X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fuxman, Ariel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5032382472","display_name":"Tom Duerig","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Duerig, Tom","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.8961,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.8961,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5582054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43147844},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.34702194}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2403.02626","pdf_url":"https://arxiv.org/pdf/2403.02626","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2403.02626","pdf_url":"https://arxiv.org/pdf/2403.02626","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391913857","https://openalex.org/W2748952813","https://openalex.org/W2530322880","https://openalex.org/W2478288626","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890"],"abstract_inverted_index":{"From":[0],"content":[1],"moderation":[2],"to":[3,13,39,65,77,110,123,146],"wildlife":[4],"conservation,":[5],"the":[6,106,149,166],"number":[7],"of":[8,58,71,117],"applications":[9],"that":[10,93,179],"require":[11],"models":[12,142,178,198,209,218],"recognize":[14],"nuanced":[15],"or":[16,36,69],"subjective":[17,187],"visual":[18,216],"concepts":[19,27,188],"is":[20],"growing.":[21],"Traditionally,":[22],"developing":[23],"classifiers":[24],"for":[25,45,168],"such":[26],"requires":[28],"substantial":[29],"manual":[30,95],"effort":[31,96,108],"measured":[32],"in":[33,136,182],"hours,":[34],"days,":[35],"even":[37],"months":[38],"identify":[40],"and":[41,143,154,189,214],"annotate":[42],"data":[43,74,159],"needed":[44],"training.":[46],"Even":[47],"with":[48,101],"recently":[49],"proposed":[50],"Agile":[51,201],"Modeling":[52,202],"techniques,":[53],"which":[54],"enable":[55],"rapid":[56],"bootstrapping":[57],"image":[59,193],"classifiers,":[60],"users":[61],"are":[62,180],"still":[63],"required":[64,109],"spend":[66],"30":[67],"minutes":[68],"more":[70],"monotonous,":[72],"repetitive":[73],"labeling":[75,100,120,157],"just":[76],"train":[78],"a":[79,90,112],"single":[80],"classifier.":[81],"Drawing":[82],"on":[83],"Fiske's":[84],"Cognitive":[85],"Miser":[86],"theory,":[87],"we":[88],"propose":[89],"new":[91],"framework":[92,132,164,173],"alleviates":[94],"by":[97,114,155],"replacing":[98],"human":[99],"natural":[102,128],"language":[103,129,141],"interactions,":[104],"reducing":[105],"total":[107],"define":[111],"concept":[113,150],"an":[115],"order":[116],"magnitude:":[118],"from":[119],"2,000":[121],"images":[122],"only":[124],"100":[125],"plus":[126],"some":[127],"interactions.":[130],"Our":[131],"leverages":[133],"recent":[134],"advances":[135],"foundation":[137],"models,":[138,145],"both":[139],"large":[140,215],"vision-language":[144],"carve":[147],"out":[148],"space":[151],"through":[152],"conversation":[153],"automatically":[156],"training":[158],"points.":[160],"Most":[161],"importantly,":[162],"our":[163,172,196],"eliminates":[165],"need":[167],"crowd-sourced":[169],"annotations.":[170],"Moreover,":[171],"ultimately":[174],"produces":[175],"lightweight":[176],"classification":[177,194,208],"deployable":[181],"cost-sensitive":[183],"scenarios.":[184],"Across":[185],"15":[186],"across":[190],"2":[191],"public":[192],"datasets,":[195],"trained":[197],"outperform":[199],"traditional":[200],"as":[203,205],"well":[204],"state-of-the-art":[206],"zero-shot":[207],"like":[210,219],"ALIGN,":[211],"CLIP,":[212],"CuPL,":[213],"question-answering":[217],"PaLI-X.":[220]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4392539635","counts_by_year":[],"updated_date":"2025-04-21T15:45:02.729492","created_date":"2024-03-07"}