{"id":"https://openalex.org/W4378174044","doi":"https://doi.org/10.48550/arxiv.2305.13342","title":"On the Limitations of Simulating Active Learning","display_name":"On the Limitations of Simulating Active Learning","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4378174044","doi":"https://doi.org/10.48550/arxiv.2305.13342"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.13342","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2305.13342","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054791689","display_name":"Katerina Margatina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Margatina, Katerina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5010341007","display_name":"\u039d\u03b9\u03ba\u03cc\u03bb\u03b1\u03bf\u03c2 \u0391\u03bb\u03ad\u03c4\u03c1\u03b1\u03c2","orcid":"https://orcid.org/0000-0003-4285-1965"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aletras, Nikolaos","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":66},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9951,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/human-in-the-loop","display_name":"Human-in-the-loop","score":0.6000856}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.69648355},{"id":"https://openalex.org/C2780626000","wikidata":"https://www.wikidata.org/wiki/Q5936775","display_name":"Human-in-the-loop","level":2,"score":0.6000856},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5457236},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5383694},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5273203},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5015013},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.47559986},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47251448},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.4222159},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.13342","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.13342","pdf_url":"http://arxiv.org/pdf/2305.13342","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2305.13342","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.13342","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4206195464","https://openalex.org/W3202085196","https://openalex.org/W2625833328","https://openalex.org/W2392921965","https://openalex.org/W2377979023","https://openalex.org/W2361861616","https://openalex.org/W2358755282","https://openalex.org/W2263699433","https://openalex.org/W2228999631","https://openalex.org/W2218034408"],"abstract_inverted_index":{"Active":[0],"learning":[1,136],"(AL)":[2],"is":[3,30,47,169,211],"a":[4,31,156],"human-and-model-in-the-loop":[5],"paradigm":[6],"that":[7,96,120,146],"iteratively":[8],"selects":[9],"informative":[10],"unlabeled":[11,64],"data":[12,194],"for":[13,38,177,206],"human":[14,27],"annotation,":[15],"aiming":[16],"to":[17,44,48,140,160,171,212,215,227],"improve":[18],"over":[19],"random":[20,142],"sampling.":[21],"However,":[22],"performing":[23],"AL":[24,85,103,148,178],"experiments":[25],"with":[26,107],"annotations":[28],"on-the-fly":[29],"laborious":[32],"and":[33,56,75],"expensive":[34],"process,":[35],"thus":[36],"unrealistic":[37],"academic":[39],"research.":[40,104],"An":[41],"easy":[42],"fix":[43],"this":[45,67],"impediment":[46],"simulate":[49],"AL,":[50],"by":[51],"treating":[52],"an":[53,108],"already":[54],"labeled":[55,152],"publicly":[57],"available":[58,151],"dataset":[59],"as":[60,159,181],"the":[61,77,84,93,100,112,126,129,174,187,219,222],"pool":[62],"of":[63,102,110,125,200,224],"data.":[65,165],"In":[66,198],"position":[68],"paper,":[69],"we":[70,202],"first":[71],"survey":[72],"recent":[73],"literature":[74],"highlight":[76],"challenges":[78],"across":[79],"all":[80],"different":[81],"steps":[82],"within":[83,218],"loop.":[86],"We":[87,105,144,166],"further":[88],"unveil":[89],"neglected":[90],"caveats":[91],"in":[92,163,184,221],"experimental":[94],"setup":[95],"can":[97,115],"significantly":[98],"affect":[99],"quality":[101],"continue":[106],"exploration":[109],"how":[111],"simulation":[113],"setting":[114],"govern":[116],"empirical":[117],"findings,":[118],"arguing":[119],"it":[121,168],"might":[122,154],"be":[123],"one":[124],"answers":[127],"behind":[128],"ever":[130],"posed":[131],"question":[132],"``why":[133],"do":[134],"active":[135],"algorithms":[137,149],"sometimes":[138],"fail":[139],"outperform":[141],"sampling?''.":[143],"argue":[145],"evaluating":[147],"on":[150],"datasets":[153],"provide":[155],"lower":[157],"bound":[158],"their":[161],"effectiveness":[162],"real":[164],"believe":[167],"essential":[170],"collectively":[172],"shape":[173],"best":[175],"practices":[176],"research,":[179],"particularly":[180],"engineering":[182],"advancements":[183],"LLMs":[185],"push":[186],"research":[188],"focus":[189],"towards":[190],"data-driven":[191],"approaches":[192],"(e.g.,":[193],"efficiency,":[195],"alignment,":[196],"fairness).":[197],"light":[199],"this,":[201],"have":[203],"developed":[204],"guidelines":[205],"future":[207],"work.":[208],"Our":[209],"aim":[210],"draw":[213],"attention":[214],"these":[216],"limitations":[217],"community,":[220],"hope":[223],"finding":[225],"ways":[226],"address":[228],"them.":[229]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4378174044","counts_by_year":[],"updated_date":"2025-02-23T03:57:27.427437","created_date":"2023-05-26"}