{"id":"https://openalex.org/W4386794859","doi":"https://doi.org/10.48550/arxiv.2309.07658","title":"DDSP-based Neural Waveform Synthesis of Polyphonic Guitar Performance from String-wise MIDI Input","display_name":"DDSP-based Neural Waveform Synthesis of Polyphonic Guitar Performance from String-wise MIDI Input","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4386794859","doi":"https://doi.org/10.48550/arxiv.2309.07658"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2309.07658","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2309.07658","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018525507","display_name":"Nicolas Jonason","orcid":"https://orcid.org/0009-0003-8553-3542"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jonason, Nicolas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100327839","display_name":"Xin Wang","orcid":"https://orcid.org/0000-0001-8246-0606"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082349516","display_name":"Erica Cooper","orcid":"https://orcid.org/0000-0002-2978-2793"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cooper, Erica","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081575688","display_name":"Lauri Juvela","orcid":"https://orcid.org/0000-0002-2201-103X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Juvela, Lauri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054217723","display_name":"Bob L. Sturm","orcid":"https://orcid.org/0000-0003-2549-6367"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sturm, Bob L. T.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5007639385","display_name":"Junichi Yamagishi","orcid":"https://orcid.org/0000-0003-2752-3955"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yamagishi, Junichi","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":67},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9911,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/midi","display_name":"MIDI","score":0.95383346},{"id":"https://openalex.org/keywords/guitar","display_name":"Guitar","score":0.8577602},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47663534}],"concepts":[{"id":"https://openalex.org/C8112396","wikidata":"https://www.wikidata.org/wiki/Q80535","display_name":"MIDI","level":2,"score":0.95383346},{"id":"https://openalex.org/C95543465","wikidata":"https://www.wikidata.org/wiki/Q6607","display_name":"Guitar","level":2,"score":0.8577602},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.73511475},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6540808},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6501621},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.6304865},{"id":"https://openalex.org/C197424946","wikidata":"https://www.wikidata.org/wiki/Q1165717","display_name":"Waveform","level":3,"score":0.55207914},{"id":"https://openalex.org/C79018884","wikidata":"https://www.wikidata.org/wiki/Q622324","display_name":"Loudness","level":2,"score":0.51986957},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47663534},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.44826517},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3987912},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34732392},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.12875369},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.104450494},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0986177},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.08692849},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2309.07658","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2309.07658","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2309.07658","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4388340484","https://openalex.org/W4385984930","https://openalex.org/W4242364395","https://openalex.org/W4220911637","https://openalex.org/W3133630535","https://openalex.org/W2992982157","https://openalex.org/W2398084541","https://openalex.org/W2386555541","https://openalex.org/W2093318920","https://openalex.org/W1564064486"],"abstract_inverted_index":{"We":[0,14,36,60],"explore":[1],"the":[2,47,64,98,102],"use":[3],"of":[4,101],"neural":[5],"synthesis":[6,92],"for":[7],"acoustic":[8],"guitar":[9],"from":[10,94],"string-wise":[11],"MIDI":[12,95],"input.":[13],"propose":[15],"four":[16,40,103],"different":[17],"systems":[18,41],"and":[19,26,32,49,56],"compare":[20],"them":[21],"with":[22],"both":[23],"objective":[24],"metrics":[25],"subjective":[27],"evaluation":[28],"against":[29],"natural":[30],"audio":[31],"a":[33,70,75],"sample-based":[34],"baseline.":[35],"iteratively":[37],"develop":[38],"these":[39],"by":[42],"making":[43],"various":[44],"considerations":[45],"on":[46],"architecture":[48],"intermediate":[50],"tasks,":[51],"such":[52],"as":[53,69],"predicting":[54],"pitch":[55],"loudness":[57],"control":[58,65],"features.":[59],"find":[61,83],"that":[62,84],"formulating":[63],"feature":[66],"prediction":[67],"task":[68,72,77],"classification":[71],"rather":[73],"than":[74],"regression":[76],"yields":[78],"better":[79],"results.":[80],"Furthermore,":[81],"we":[82],"our":[85],"simplest":[86],"proposed":[87,104],"system,":[88],"which":[89],"directly":[90],"predicts":[91],"parameters":[93],"input":[96],"performs":[97],"best":[99],"out":[100],"systems.":[105],"Audio":[106],"examples":[107],"are":[108],"available":[109],"at":[110],"https://erl-j.github.io/neural-guitar-web-supplement.":[111]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4386794859","counts_by_year":[],"updated_date":"2024-12-31T08:37:25.860545","created_date":"2023-09-16"}