{"id":"https://openalex.org/W4399695424","doi":"https://doi.org/10.48550/arxiv.2406.08900","title":"On Improving Error Resilience of Neural End-to-End Speech Coders","display_name":"On Improving Error Resilience of Neural End-to-End Speech Coders","publication_year":2024,"publication_date":"2024-06-13","ids":{"openalex":"https://openalex.org/W4399695424","doi":"https://doi.org/10.48550/arxiv.2406.08900"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2406.08900","pdf_url":"https://arxiv.org/pdf/2406.08900","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.08900","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102051987","display_name":"Kishan Chand Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Kishan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039716073","display_name":"Nicola Pia","orcid":"https://orcid.org/0000-0003-0987-863X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pia, Nicola","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077147264","display_name":"Srikanth Korse","orcid":"https://orcid.org/0009-0008-7564-9628"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Korse, Srikanth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078105594","display_name":"Andreas Brendel","orcid":"https://orcid.org/0000-0002-6051-6346"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brendel, Andreas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054985419","display_name":"Guillaume Fuchs","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fuchs, Guillaume","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5009684245","display_name":"Markus Multrus","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Multrus, Markus","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":79},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9681,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9681,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9552,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.84845734},{"id":"https://openalex.org/keywords/resilience","display_name":"Resilience","score":0.68851507}],"concepts":[{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.84845734},{"id":"https://openalex.org/C2779585090","wikidata":"https://www.wikidata.org/wiki/Q3457762","display_name":"Resilience (materials science)","level":2,"score":0.68851507},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6058899},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5219706},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16911489},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2406.08900","pdf_url":"https://arxiv.org/pdf/2406.08900","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2406.08900","pdf_url":"https://arxiv.org/pdf/2406.08900","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4396701345","https://openalex.org/W4396696052","https://openalex.org/W4391375266","https://openalex.org/W3179968364","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2001405890","https://openalex.org/W1999612375"],"abstract_inverted_index":{"Error":[0,10],"resilient":[1],"tools":[2],"like":[3,23],"Packet":[4],"Loss":[5],"Concealment":[6],"(PLC)":[7],"and":[8,34,128,137,142],"Forward":[9],"Correction":[11],"(FEC)":[12],"are":[13,31],"essential":[14],"to":[15,49,52,92,101,114],"maintain":[16],"a":[17,45,69,97,112],"reliable":[18],"speech":[19,41,54,84],"communication":[20],"for":[21],"applications":[22],"Voice":[24],"over":[25],"Internet":[26],"Protocol":[27],"(VoIP),":[28],"where":[29],"packets":[30],"frequently":[32],"delayed":[33],"lost.":[35],"In":[36],"recent":[37],"times,":[38],"end-to-end":[39],"neural":[40],"codecs":[42],"have":[43],"seen":[44],"significant":[46,145],"rise,":[47],"due":[48],"their":[50,65],"ability":[51],"transmit":[53],"signal":[55],"at":[56,85,119],"low":[57,86,98],"bitrates":[58],"but":[59],"few":[60],"considerations":[61],"were":[62],"made":[63],"about":[64],"error":[66],"resilience":[67],"in":[68,106],"real":[70],"system.":[71],"Recently":[72],"introduced":[73],"Neural":[74],"End-to-End":[75],"Speech":[76],"Codec":[77],"(NESC)":[78],"can":[79],"reproduce":[80],"high":[81],"quality":[82],"natural":[83],"bitrates.":[87],"We":[88],"extend":[89],"its":[90],"robustness":[91,146],"packet":[93,148],"losses":[94],"by":[95],"adding":[96],"complexity":[99],"network":[100],"predict":[102],"the":[103,132],"codebook":[104],"indices":[105],"latent":[107],"space.":[108],"Furthermore,":[109],"we":[110],"propose":[111],"method":[113],"add":[115],"an":[116,120],"in-band":[117],"FEC":[118,143],"additional":[121],"bitrate":[122],"of":[123,134],"0.8":[124],"kbps.":[125],"Both":[126],"subjective":[127],"objective":[129],"assessment":[130],"indicate":[131],"effectiveness":[133],"proposed":[135],"methods,":[136],"demonstrate":[138],"that":[139],"coupling":[140],"PLC":[141],"provide":[144],"against":[147],"losses.":[149]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4399695424","counts_by_year":[],"updated_date":"2025-03-18T11:15:26.541403","created_date":"2024-06-15"}