{"id":"https://openalex.org/W4353004366","doi":"https://doi.org/10.1162/tacl_a_00547","title":"Efficient Long-Text Understanding with Short-Text Models","display_name":"Efficient Long-Text Understanding with Short-Text Models","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4353004366","doi":"https://doi.org/10.1162/tacl_a_00547"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00547","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00547/2075722/tacl_a_00547.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00547/2075722/tacl_a_00547.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041579054","display_name":"Maor Ivgi","orcid":null},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"funder","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Maor Ivgi","raw_affiliation_strings":["The Blavatnik School of Computer Science, Tel-Aviv University, Israel. maor.ivgi@cs.tau.ac.il"],"affiliations":[{"raw_affiliation_string":"The Blavatnik School of Computer Science, Tel-Aviv University, Israel. maor.ivgi@cs.tau.ac.il","institution_ids":["https://openalex.org/I16391192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088774511","display_name":"Uri Shaham","orcid":"https://orcid.org/0000-0002-5928-4269"},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"funder","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Uri Shaham","raw_affiliation_strings":["The Blavatnik School of Computer Science, Tel-Aviv University, Israel. uri.shaham@cs.tau.ac.il"],"affiliations":[{"raw_affiliation_string":"The Blavatnik School of Computer Science, Tel-Aviv University, Israel. uri.shaham@cs.tau.ac.il","institution_ids":["https://openalex.org/I16391192"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045872048","display_name":"Jonathan Berant","orcid":null},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"funder","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Jonathan Berant","raw_affiliation_strings":["The Blavatnik School of Computer Science, Tel-Aviv University, Israel. joberant@cs.tau.ac.il"],"affiliations":[{"raw_affiliation_string":"The Blavatnik School of Computer Science, Tel-Aviv University, Israel. joberant@cs.tau.ac.il","institution_ids":["https://openalex.org/I16391192"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5041579054","https://openalex.org/A5088774511","https://openalex.org/A5045872048"],"corresponding_institution_ids":["https://openalex.org/I16391192","https://openalex.org/I16391192","https://openalex.org/I16391192"],"apc_list":{"value":0,"currency":"USD","value_usd":0},"apc_paid":null,"fwci":6.262,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.796876,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"11","issue":null,"first_page":"284","last_page":"299"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9714,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scratch","display_name":"Scratch","score":0.53840494},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.5188433},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.514765},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4468054}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8839313},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7817409},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.689856},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.64741844},{"id":"https://openalex.org/C2781235140","wikidata":"https://www.wikidata.org/wiki/Q275131","display_name":"Scratch","level":2,"score":0.53840494},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.5188433},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.514765},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4468054},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.44186068},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.43873423},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4370549},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35551506},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.33596313},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.12767327},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.11388081},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00547","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00547/2075722/tacl_a_00547.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2208.00748","pdf_url":"http://arxiv.org/pdf/2208.00748","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00547","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00547/2075722/tacl_a_00547.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.72,"display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":37,"referenced_works":["https://openalex.org/W2889787757","https://openalex.org/W2951328433","https://openalex.org/W2963748441","https://openalex.org/W2963963993","https://openalex.org/W2965373594","https://openalex.org/W2971105107","https://openalex.org/W2979826702","https://openalex.org/W3015468748","https://openalex.org/W3033182847","https://openalex.org/W3033529678","https://openalex.org/W3034999214","https://openalex.org/W3035390927","https://openalex.org/W3105238007","https://openalex.org/W3131922516","https://openalex.org/W3153603860","https://openalex.org/W3156789018","https://openalex.org/W3161820423","https://openalex.org/W3170490008","https://openalex.org/W3171639395","https://openalex.org/W3172540065","https://openalex.org/W3201977280","https://openalex.org/W3209374680","https://openalex.org/W4200633770","https://openalex.org/W4212774754","https://openalex.org/W4221145950","https://openalex.org/W4225727438","https://openalex.org/W4225958595","https://openalex.org/W4280652569","https://openalex.org/W4281254837","https://openalex.org/W4281736354","https://openalex.org/W4283734749","https://openalex.org/W4287667694","https://openalex.org/W4287888039","https://openalex.org/W4288089799","https://openalex.org/W4323274322","https://openalex.org/W4385573804","https://openalex.org/W4389518729"],"related_works":["https://openalex.org/W322691623","https://openalex.org/W2770018148","https://openalex.org/W2475116013","https://openalex.org/W2385135707","https://openalex.org/W2358308169","https://openalex.org/W2275988210","https://openalex.org/W2140315382","https://openalex.org/W2082556335","https://openalex.org/W2066741154","https://openalex.org/W2059109728"],"abstract_inverted_index":{"Abstract":[0],"Transformer-based":[1],"pretrained":[2,77,97],"language":[3,10,136],"models":[4,147],"(LMs)":[5],"are":[6,43,149],"ubiquitous":[7],"across":[8,102,131],"natural":[9],"understanding,":[11],"but":[12],"cannot":[13],"be":[14],"applied":[15],"to":[16,28,99,151],"long":[17,25,69,117],"sequences":[18,70],"such":[19],"as":[20],"stories,":[21],"scientific":[22],"articles,":[23],"and":[24,62,73,94,120,154,158],"documents":[26],"due":[27],"their":[29],"quadratic":[30],"complexity.":[31],"While":[32],"a":[33,64,90,113,126,132,156],"myriad":[34],"of":[35,135],"efficient":[36],"transformer":[37],"variants":[38],"have":[39],"been":[40],"proposed,":[41],"they":[42],"typically":[44],"based":[45],"on":[46,124],"custom":[47],"implementations":[48],"that":[49,71,110,141,148],"require":[50,155],"expensive":[51,159],"pretraining":[52,160],"from":[53],"scratch.":[54],"In":[55],"this":[56],"work,":[57],"we":[58,80],"propose":[59],"SLED:":[60],"SLiding-Encoder":[61],"Decoder,":[63],"simple":[65],"approach":[66,123],"for":[67,116],"processing":[68],"re-uses":[72],"leverages":[74],"battle-tested":[75],"short-text":[76,91],"LMs.":[78],"Specifically,":[79],"partition":[81],"the":[82,96],"input":[83],"into":[84],"overlapping":[85],"chunks,":[86],"encode":[87],"each":[88],"with":[89,128,145],"LM":[92],"encoder":[93],"use":[95],"decoder":[98],"fuse":[100],"information":[101],"chunks":[103],"(fusion-in-decoder).":[104],"We":[105,139],"illustrate":[106],"through":[107],"controlled":[108],"experiments":[109],"SLED":[111,142],"offers":[112],"viable":[114],"strategy":[115],"text":[118],"understanding":[119,137],"evaluate":[121],"our":[122],"SCROLLS,":[125],"benchmark":[127],"seven":[129],"datasets":[130],"wide":[133],"range":[134],"tasks.":[138],"find":[140],"is":[143],"competitive":[144],"specialized":[146],"up":[150],"50x":[152],"larger":[153],"dedicated":[157],"step.":[161]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4353004366","counts_by_year":[{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":13}],"updated_date":"2025-03-20T10:56:11.986073","created_date":"2023-03-23"}