{"id":"https://openalex.org/W4307927803","doi":"https://doi.org/10.48550/arxiv.2210.16422","title":"Toward Unifying Text Segmentation and Long Document Summarization","display_name":"Toward Unifying Text Segmentation and Long Document Summarization","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4307927803","doi":"https://doi.org/10.48550/arxiv.2210.16422"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2210.16422","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2210.16422","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042006948","display_name":"Sangwoo Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, Sangwoo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083752471","display_name":"Kaiqiang Song","orcid":"https://orcid.org/0000-0001-8203-9723"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Kaiqiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100334518","display_name":"Xiaoyang Wang","orcid":"https://orcid.org/0000-0003-4213-0762"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xiaoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100394562","display_name":"Fei Liu","orcid":"https://orcid.org/0000-0001-7141-5105"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Fei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5034476404","display_name":"Dong Yu","orcid":"https://orcid.org/0000-0003-0520-6844"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Dong","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":59},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9951,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/market-segmentation","display_name":"Market Segmentation","score":0.6625831}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.93021},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8717489},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.78851986},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.6625831},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6405957},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6098058},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5194592},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.45108327},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2210.16422","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2210.16422","pdf_url":"http://arxiv.org/pdf/2210.16422","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2210.16422","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2210.16422","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality education","score":0.65}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4205247302","https://openalex.org/W2592395359","https://openalex.org/W2535231171","https://openalex.org/W2501551404","https://openalex.org/W2468652214","https://openalex.org/W2326647871","https://openalex.org/W2130144716","https://openalex.org/W2045342254","https://openalex.org/W1504527458","https://openalex.org/W1501331687"],"abstract_inverted_index":{"Text":[0],"segmentation":[1,41,56,76,149],"is":[2,19,34,79],"important":[3,30],"for":[4,21],"signaling":[5],"a":[6,11,38,139],"document's":[7],"structure.":[8],"Without":[9],"segmenting":[10],"long":[12],"document":[13],"into":[14],"topically":[15],"coherent":[16],"sections,":[17],"it":[18],"difficult":[20],"readers":[22],"to":[23,86,103,106,143],"comprehend":[24],"the":[25,52,108,115,145],"text,":[26],"let":[27],"alone":[28],"find":[29],"information.":[31],"The":[32],"problem":[33],"only":[35,119],"exacerbated":[36],"by":[37,72,82],"lack":[39],"of":[40,44,61,89,141,147,156],"in":[42,58],"transcripts":[43,105],"audio/video":[45],"recordings.":[46],"In":[47],"this":[48],"paper,":[49],"we":[50],"explore":[51],"role":[53],"that":[54,114],"section":[55,148],"plays":[57],"extractive":[59],"summarization":[60,74],"written":[62,152],"and":[63,75,153,159],"spoken":[64,104,154],"documents.":[65],"Our":[66,111],"approach":[67],"learns":[68],"robust":[69],"sentence":[70],"representations":[71],"performing":[73],"simultaneously,":[77],"which":[78],"further":[80],"enhanced":[81],"an":[83],"optimization-based":[84],"regularizer":[85],"promote":[87],"selection":[88],"diverse":[90],"summary":[91],"sentences.":[92],"We":[93,137],"conduct":[94],"experiments":[95],"on":[96,123,150],"multiple":[97],"datasets":[98],"ranging":[99],"from":[100],"scientific":[101],"articles":[102],"evaluate":[107],"model's":[109],"performance.":[110],"findings":[112],"suggest":[113],"model":[116],"can":[117],"not":[118],"achieve":[120],"state-of-the-art":[121],"performance":[122],"publicly":[124],"available":[125],"benchmarks,":[126],"but":[127],"demonstrate":[128],"better":[129],"cross-genre":[130],"transferability":[131],"when":[132],"equipped":[133],"with":[134],"text":[135],"segmentation.":[136],"perform":[138],"series":[140],"analyses":[142],"quantify":[144],"impact":[146],"summarizing":[151],"documents":[155],"substantial":[157],"length":[158],"complexity.":[160]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4307927803","counts_by_year":[],"updated_date":"2025-03-02T02:07:20.722890","created_date":"2022-11-06"}