{"id":"https://openalex.org/W4392873868","doi":"https://doi.org/10.48550/arxiv.2403.09455","title":"The Neural-SRP method for positional sound source localization","display_name":"The Neural-SRP method for positional sound source localization","publication_year":2024,"publication_date":"2024-03-14","ids":{"openalex":"https://openalex.org/W4392873868","doi":"https://doi.org/10.48550/arxiv.2403.09455"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.09455","pdf_url":"http://arxiv.org/pdf/2403.09455","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2403.09455","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011673214","display_name":"Eric Grinstein","orcid":"https://orcid.org/0000-0003-4502-5407"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Grinstein, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073284331","display_name":"Toon van Waterschoot","orcid":"https://orcid.org/0000-0002-6323-7350"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"van Waterschoot, Toon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004899548","display_name":"Mike Brookes","orcid":"https://orcid.org/0000-0001-7105-4936"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brookes, Mike","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5016227729","display_name":"Patrick A. Naylor","orcid":"https://orcid.org/0000-0001-8546-8013"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naylor, Patrick A.","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":82},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9967,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9967,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12537","display_name":"Flow Measurement and Analysis","score":0.9663,"subfield":{"id":"https://openalex.org/subfields/2211","display_name":"Mechanics of Materials"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.6412317},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.49923754},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.4183641},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10979754}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.09455","pdf_url":"http://arxiv.org/pdf/2403.09455","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.09455","pdf_url":"http://arxiv.org/pdf/2403.09455","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391913857","https://openalex.org/W2909726438","https://openalex.org/W2748952813","https://openalex.org/W2478288626","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Steered":[0],"Response":[1],"Power":[2],"(SRP)":[3],"is":[4,30],"a":[5,53,87],"widely":[6],"used":[7],"method":[8],"for":[9,52],"the":[10,91,96,128],"task":[11],"of":[12,56,93,99],"sound":[13],"source":[14],"localization":[15,21,124],"using":[16,105],"microphone":[17,82],"arrays,":[18],"showing":[19],"satisfactory":[20],"performance":[22,29,97,125],"on":[23,67,115],"many":[24],"practical":[25,65],"scenarios.":[26],"However,":[27],"its":[28],"diminished":[31],"under":[32],"highly":[33],"reverberant":[34],"environments.":[35],"Although":[36],"Deep":[37],"Neural":[38],"Networks":[39],"(DNNs)":[40],"have":[41],"been":[42],"previously":[43],"proposed":[44],"to":[45],"overcome":[46],"this":[47],"limitation,":[48],"most":[49],"are":[50],"trained":[51],"specific":[54],"number":[55],"microphones":[57],"with":[58,95],"fixed":[59],"spatial":[60],"coordinates.":[61],"This":[62],"restricts":[63],"their":[64],"application":[66,78],"scenarios":[68],"frequently":[69],"observed":[70],"in":[71],"wireless":[72],"acoustic":[73],"sensor":[74],"networks,":[75],"where":[76],"each":[77],"has":[79],"an":[80],"ad-hoc":[81],"topology.":[83],"We":[84,101],"propose":[85],"Neural-SRP,":[86],"DNN":[88],"which":[89],"combines":[90],"flexibility":[92],"SRP":[94],"gains":[98],"DNNs.":[100],"train":[102],"our":[103,113],"network":[104],"simulated":[106,118],"data":[107],"and":[108,111,117],"transfer":[109],"learning,":[110],"evaluate":[112],"approach":[114],"recorded":[116],"data.":[119],"Results":[120],"verify":[121],"that":[122],"Neural-SRP's":[123],"significantly":[126],"outperforms":[127],"baselines.":[129]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4392873868","counts_by_year":[],"updated_date":"2025-01-22T19:38:06.484390","created_date":"2024-03-16"}