{"id":"https://openalex.org/W4395065451","doi":"https://doi.org/10.48550/arxiv.2404.13950","title":"SPLATE: Sparse Late Interaction Retrieval","display_name":"SPLATE: Sparse Late Interaction Retrieval","publication_year":2024,"publication_date":"2024-04-22","ids":{"openalex":"https://openalex.org/W4395065451","doi":"https://doi.org/10.48550/arxiv.2404.13950"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2404.13950","pdf_url":"https://arxiv.org/pdf/2404.13950","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.13950","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010326252","display_name":"Thibault Formal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Formal, Thibault","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031052064","display_name":"St\u00e9phane Clinchant","orcid":"https://orcid.org/0000-0003-2367-8837"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Clinchant, St\u00e9phane","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085566571","display_name":"Herv\u00e9 D\u00e9jean","orcid":"https://orcid.org/0000-0002-9837-5358"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"D\u00e9jean, Herv\u00e9","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5068114632","display_name":"Carlos Lassance","orcid":"https://orcid.org/0000-0002-7754-6656"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lassance, Carlos","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9912,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9912,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9689,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46786547},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35845175}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2404.13950","pdf_url":"https://arxiv.org/pdf/2404.13950","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2404.13950","pdf_url":"https://arxiv.org/pdf/2404.13950","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4395014643","https://openalex.org/W4391913857","https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890"],"abstract_inverted_index":{"The":[0],"late":[1,24,94],"interaction":[2,25,95],"paradigm":[3],"introduced":[4],"with":[5,78,97],"ColBERT":[6,108],"stands":[7],"out":[8],"in":[9,93,109],"the":[10,60,89,117,121],"neural":[11],"Information":[12],"Retrieval":[13],"space,":[14],"offering":[15],"a":[16,40,54,74,79],"compelling":[17],"effectiveness-efficiency":[18],"trade-off":[19],"across":[20],"many":[21],"benchmarks.":[22],"Efficient":[23],"retrieval":[26,100],"is":[27],"based":[28],"on":[29],"an":[30,35,65],"optimized":[31],"multi-step":[32],"strategy,":[33],"where":[34],"approximate":[36],"search":[37],"first":[38],"identifies":[39],"set":[41],"of":[42,59],"candidate":[43,90],"documents":[44,128],"to":[45,73,87],"re-rank":[46],"exactly.":[47],"In":[48],"this":[49],"work,":[50],"we":[51],"introduce":[52],"SPLATE,":[53],"simple":[55],"and":[56],"lightweight":[57],"adaptation":[58],"ColBERTv2":[61,114,123],"model":[62],"which":[63],"learns":[64],"``MLM":[66],"adapter'',":[67],"mapping":[68],"its":[69],"frozen":[70],"token":[71],"embeddings":[72],"sparse":[75,99],"vocabulary":[76],"space":[77],"partially":[80],"learned":[81],"SPLADE":[82],"module.":[83],"This":[84],"allows":[85],"us":[86],"perform":[88],"generation":[91],"step":[92],"pipelines":[96],"traditional":[98],"techniques,":[101],"making":[102],"it":[103],"particularly":[104],"appealing":[105],"for":[106],"running":[107],"CPU":[110],"environments.":[111],"Our":[112],"SPLATE":[113],"pipeline":[115],"achieves":[116],"same":[118],"effectiveness":[119],"as":[120],"PLAID":[122],"engine":[124],"by":[125],"re-ranking":[126],"50":[127],"that":[129],"can":[130],"be":[131],"retrieved":[132],"under":[133],"10ms.":[134]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4395065451","counts_by_year":[],"updated_date":"2025-04-03T02:43:28.622085","created_date":"2024-04-24"}