{"id":"https://openalex.org/W4386044615","doi":"https://doi.org/10.48550/arxiv.2308.08926","title":"Explicit Estimation of Magnitude and Phase Spectra in Parallel for High-Quality Speech Enhancement","display_name":"Explicit Estimation of Magnitude and Phase Spectra in Parallel for High-Quality Speech Enhancement","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4386044615","doi":"https://doi.org/10.48550/arxiv.2308.08926"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.08926","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2308.08926","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072371384","display_name":"Ye-Xin Lu","orcid":"https://orcid.org/0009-0009-8026-0702"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Ye-Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014746276","display_name":"Yang Ai","orcid":"https://orcid.org/0009-0006-0157-4980"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ai, Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5059767940","display_name":"Zhen-Hua Ling","orcid":"https://orcid.org/0000-0001-7853-5273"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ling, Zhen-Hua","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.811105,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":67,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9282,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C126691448","wikidata":"https://www.wikidata.org/wiki/Q2028919","display_name":"Magnitude (astronomy)","level":2,"score":0.7458397},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.57796437},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.55515707},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.5441462},{"id":"https://openalex.org/C4839761","wikidata":"https://www.wikidata.org/wiki/Q212111","display_name":"Spectral line","level":2,"score":0.42264846},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39985034},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.23920876},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10983908},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.10420698},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.06538868},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.08926","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2308.08926","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.08926","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.76,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, justice, and strong institutions"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4311345787","https://openalex.org/W3185336960","https://openalex.org/W2376418092","https://openalex.org/W2257644995","https://openalex.org/W2225665239","https://openalex.org/W2188141918","https://openalex.org/W2072983018","https://openalex.org/W2042652790","https://openalex.org/W1513444457","https://openalex.org/W1016952678"],"abstract_inverted_index":{"Phase":[0,63],"information":[1],"has":[2],"a":[3,36,53,71,107,112,124,129],"significant":[4],"impact":[5],"on":[6,140],"speech":[7,14,40,190,194,204],"perceptual":[8,224],"quality":[9,225],"and":[10,28,62,84,101,111,118,128,147,174,197,216],"intelligibility.":[11],"However,":[12],"existing":[13,202],"enhancement":[15,191,205],"methods":[16],"encounter":[17],"limitations":[18],"in":[19,38,47,65],"explicit":[20,219],"phase":[21,85,113,120,130,145,217,220],"estimation":[22,132],"due":[23],"to":[24,35,78,153,165,201],"the":[25,32,44,80,141,156,168,210,214,223],"non-structural":[26],"nature":[27],"wrapping":[29],"characteristics":[30],"of":[31,226],"phase,":[33],"leading":[34],"bottleneck":[37],"enhanced":[39,227],"quality.":[41],"To":[42],"overcome":[43],"above":[45],"issue,":[46],"this":[48],"paper,":[49],"we":[50],"proposed":[51,68,183],"MP-SENet,":[52],"novel":[54],"Speech":[55],"Enhancement":[56],"Network":[57],"that":[58,181],"explicitly":[59,138],"enhances":[60],"Magnitude":[61],"spectra":[64,86,121,150],"parallel.":[66],"The":[67,75,104],"MP-SENet":[69,157,184],"comprises":[70,106],"Transformer-embedded":[72],"encoder-decoder":[73],"architecture.":[74],"encoder":[76],"aims":[77],"encode":[79],"input":[81],"distorted":[82],"magnitude":[83,108,117,125,142,215],"into":[87,94],"time-frequency":[88,95],"representations,":[89],"which":[90],"are":[91,151],"further":[92,163,208],"fed":[93],"Transformers":[96],"for":[97,167],"alternatively":[98],"capturing":[99],"time":[100],"frequency":[102],"dependencies.":[103],"decoder":[105,110],"mask":[109],"decoder,":[114],"directly":[115],"enhancing":[116],"wrapped":[119,144],"by":[122,218],"incorporating":[123],"masking":[126],"architecture":[127],"parallel":[131],"architecture,":[133],"respectively.":[134],"Multi-level":[135],"loss":[136],"functions":[137],"defined":[139],"spectra,":[143,146],"short-time":[148],"complex":[149],"adopted":[152],"jointly":[154],"train":[155],"model.":[158],"A":[159],"metric":[160],"discriminator":[161],"is":[162],"employed":[164],"compensate":[166],"incomplete":[169],"correlation":[170],"between":[171,213],"these":[172],"losses":[173],"human":[175],"auditory":[176],"perception.":[177],"Experimental":[178],"results":[179],"demonstrate":[180],"our":[182],"achieves":[185],"state-of-the-art":[186],"performance":[187],"across":[188],"multiple":[189],"tasks,":[192],"including":[193],"denoising,":[195],"dereverberation,":[196],"bandwidth":[198],"extension.":[199],"Compared":[200],"phase-aware":[203],"methods,":[206],"it":[207],"mitigates":[209],"compensation":[211],"effect":[212],"estimation,":[221],"elevating":[222],"speech.":[228]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4386044615","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-01-02T01:07:58.707718","created_date":"2023-08-22"}