{"id":"https://openalex.org/W4396814770","doi":"https://doi.org/10.48550/arxiv.2405.04272","title":"BUDDy: Single-Channel Blind Unsupervised Dereverberation with Diffusion\n Models","display_name":"BUDDy: Single-Channel Blind Unsupervised Dereverberation with Diffusion\n Models","publication_year":2024,"publication_date":"2024-05-07","ids":{"openalex":"https://openalex.org/W4396814770","doi":"https://doi.org/10.48550/arxiv.2405.04272"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.04272","pdf_url":"https://arxiv.org/pdf/2405.04272","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.04272","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030929567","display_name":"Eloi Moliner","orcid":"https://orcid.org/0000-0001-5719-326X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moliner, Eloi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006784595","display_name":"Jean-Marie Lemercier","orcid":"https://orcid.org/0000-0002-8704-7658"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lemercier, Jean-Marie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037310428","display_name":"Simon Welker","orcid":"https://orcid.org/0000-0002-6349-8462"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Welker, Simon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087022569","display_name":"Timo Gerkmann","orcid":"https://orcid.org/0000-0002-8678-4699"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gerkmann, Timo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5021963945","display_name":"Vesa V\u00e4lim\u00e4ki","orcid":"https://orcid.org/0000-0002-7869-292X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"V\u00e4lim\u00e4ki, Vesa","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":83},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9783,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9783,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.972,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4996264},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.4850799},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47871757},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3930899},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.33691904},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.14438081},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10646328},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.04272","pdf_url":"https://arxiv.org/pdf/2405.04272","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.04272","pdf_url":"https://arxiv.org/pdf/2405.04272","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4396701345","https://openalex.org/W4396696052","https://openalex.org/W4395014643","https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2001405890"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,98,116],"present":[4],"an":[5,73],"unsupervised":[6,113],"single-channel":[7],"method":[8,108],"for":[9,36,81],"joint":[10],"blind":[11,112,128],"dereverberation":[12,102],"and":[13,40,115,133],"room":[14,90],"impulse":[15,91],"response":[16,92],"estimation,":[17],"based":[18],"on":[19],"posterior":[20],"sampling":[21],"with":[22,33,68],"diffusion":[23,55,75],"models.":[24],"We":[25],"parameterize":[26],"the":[27,43,47,53,62,65,69,89],"reverberation":[28],"operator":[29],"using":[30],"a":[31,78],"filter":[32],"exponential":[34],"decay":[35],"each":[37],"frequency":[38],"subband,":[39],"iteratively":[41],"estimate":[42],"corresponding":[44],"parameters":[45],"as":[46],"speech":[48,67,83],"utterance":[49],"gets":[50],"refined":[51],"along":[52],"reverse":[54],"trajectory.":[56],"A":[57],"measurement":[58],"consistency":[59],"criterion":[60],"enforces":[61],"fidelity":[63],"of":[64,88],"generated":[66],"reverberant":[70],"measurement,":[71],"while":[72],"unconditional":[74],"model":[76],"implements":[77],"strong":[79],"prior":[80],"clean":[82],"generation.":[84],"Without":[85],"any":[86,94],"knowledge":[87],"nor":[93],"coupled":[95],"reverberant-anechoic":[96],"data,":[97],"can":[99],"successfully":[100],"perform":[101],"in":[103,125],"various":[104],"acoustic":[105,123],"scenarios.":[106],"Our":[107],"significantly":[109],"outperforms":[110],"previous":[111],"baselines,":[114],"demonstrate":[117],"its":[118],"increased":[119],"robustness":[120],"to":[121,127],"unseen":[122],"conditions":[124],"comparison":[126],"supervised":[129],"methods.":[130],"Audio":[131],"samples":[132],"code":[134],"are":[135],"available":[136],"online.":[137]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4396814770","counts_by_year":[],"updated_date":"2025-01-08T23:46:06.305836","created_date":"2024-05-11"}