{"id":"https://openalex.org/W3137678309","doi":"https://doi.org/10.1109/bigdata50022.2020.9378438","title":"A Study of Spoken Audio Processing using Machine Learning for Libraries, Archives and Museums (LAM)","display_name":"A Study of Spoken Audio Processing using Machine Learning for Libraries, Archives and Museums (LAM)","publication_year":2020,"publication_date":"2020-12-10","ids":{"openalex":"https://openalex.org/W3137678309","doi":"https://doi.org/10.1109/bigdata50022.2020.9378438","mag":"3137678309"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata50022.2020.9378438","pdf_url":null,"source":{"id":"https://openalex.org/S4363607718","display_name":"2021 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101883722","display_name":"Weijia Xu","orcid":"https://orcid.org/0000-0002-5134-6381"},"institutions":[],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weijia Xu","raw_affiliation_strings":["Texas Advanced Computing Center, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Texas Advanced Computing Center, University of Texas at Austin, Austin, Texas, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078797277","display_name":"Mar\u00eda Esteva","orcid":"https://orcid.org/0000-0001-6204-4517"},"institutions":[],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maria Esteva","raw_affiliation_strings":["Texas Advanced Computing Center, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Texas Advanced Computing Center, University of Texas at Austin, Austin, Texas, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010080547","display_name":"Peter Cui","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peter Cui","raw_affiliation_strings":["Department of Computer Science, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, Texas, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040568201","display_name":"Eugene Castillo","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eugene Castillo","raw_affiliation_strings":["Department of Computer Science, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, Texas, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031190010","display_name":"Kewen Wang","orcid":"https://orcid.org/0000-0002-0542-3761"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kewen Wang","raw_affiliation_strings":["Department of Computer Science, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, Texas, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005553832","display_name":"H. Kenneth Hopkins","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hanna-Robbins Hopkins","raw_affiliation_strings":["Department of English, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Department of English, University of Texas at Austin, Austin, Texas, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087287236","display_name":"Tanya Clement","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tanya Clement","raw_affiliation_strings":["Department of English, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Department of English, University of Texas at Austin, Austin, Texas, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078405142","display_name":"Aaron Choate","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aaron Choate","raw_affiliation_strings":["University of Texas Libraries, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"University of Texas Libraries, University of Texas at Austin, Austin, Texas, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057218817","display_name":"Ruizhu Huang","orcid":"https://orcid.org/0000-0003-3285-1945"},"institutions":[],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ruizhu Huang","raw_affiliation_strings":["Texas Advanced Computing Center, University of Texas at Austin, Austin, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Texas Advanced Computing Center, University of Texas at Austin, Austin, Texas, USA","institution_ids":[]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.131,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.214341,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":60,"max":69},"biblio":{"volume":null,"issue":null,"first_page":"1939","last_page":"1948"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription","score":0.6944836},{"id":"https://openalex.org/keywords/sync","display_name":"sync","score":0.6083766}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.8854543},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.83769363},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8376786},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.6944836},{"id":"https://openalex.org/C177291462","wikidata":"https://www.wikidata.org/wiki/Q423038","display_name":"Active listening","level":2,"score":0.6135624},{"id":"https://openalex.org/C3913047","wikidata":"https://www.wikidata.org/wiki/Q1956265","display_name":"sync","level":3,"score":0.6083766},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.45058838},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4418887},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.42369834},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.32200962},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.23331377},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata50022.2020.9378438","pdf_url":null,"source":{"id":"https://openalex.org/S4363607718","display_name":"2021 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.76}],"grants":[{"funder":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":45,"referenced_works":["https://openalex.org/W118756463","https://openalex.org/W1532325895","https://openalex.org/W1551709509","https://openalex.org/W1600744878","https://openalex.org/W1677683623","https://openalex.org/W1922655562","https://openalex.org/W2061809273","https://openalex.org/W2077236205","https://openalex.org/W2080213370","https://openalex.org/W2097207027","https://openalex.org/W2112739286","https://openalex.org/W2117671523","https://openalex.org/W2136743277","https://openalex.org/W2143612262","https://openalex.org/W2145565586","https://openalex.org/W2147229751","https://openalex.org/W2147627917","https://openalex.org/W2155273149","https://openalex.org/W2160815625","https://openalex.org/W2169189000","https://openalex.org/W2172256532","https://openalex.org/W2191333630","https://openalex.org/W2193413348","https://openalex.org/W2277583061","https://openalex.org/W2293634267","https://openalex.org/W2309460698","https://openalex.org/W2474251382","https://openalex.org/W2587195211","https://openalex.org/W2790357563","https://openalex.org/W2802642435","https://openalex.org/W2802787326","https://openalex.org/W2820734700","https://openalex.org/W2894054914","https://openalex.org/W2896457183","https://openalex.org/W2913768775","https://openalex.org/W2953039584","https://openalex.org/W2953356739","https://openalex.org/W2953384591","https://openalex.org/W2964165818","https://openalex.org/W2993258659","https://openalex.org/W3133806040","https://openalex.org/W327991062","https://openalex.org/W4213009331","https://openalex.org/W4235637372","https://openalex.org/W4294152847"],"related_works":["https://openalex.org/W2607244263","https://openalex.org/W2524993630","https://openalex.org/W2475724061","https://openalex.org/W2392768766","https://openalex.org/W2317723112","https://openalex.org/W2234430299","https://openalex.org/W2063547430","https://openalex.org/W2058118494","https://openalex.org/W1831690014","https://openalex.org/W1561022130"],"abstract_inverted_index":{"As":[0],"the":[1,20,34,84,135,139,145,157,209,216,229],"need":[2,21],"to":[3,6,22,33,45,100,162,172,176,192,236,239],"provide":[4,185],"access":[5],"spoken":[7],"word":[8],"audio":[9,29,35,71,112],"collections":[10,72],"in":[11,73,194],"libraries,":[12],"archives,":[13],"and":[14,26,40,62,92,138,150,182,184,215],"museums":[15],"(LAM)":[16],"increases,":[17],"so":[18],"does":[19],"process":[23],"them":[24],"efficiently":[25],"consistently.":[27],"Traditionally,":[28],"processing":[30,69],"involves":[31],"listening":[32],"files,":[36],"conducting":[37],"manual":[38],"transcription,":[39],"applying":[41],"controlled":[42],"subject":[43],"terms":[44],"describe":[46,101],"them.":[47,104],"This":[48],"workflow":[49,153,189],"takes":[50],"significant":[51],"time":[52],"with":[53,78,196],"each":[54,102],"recording.":[55],"In":[56],"this":[57,188],"study,":[58],"we":[59,125,241],"investigate":[60],"if":[61],"how":[63],"machine":[64],"learning":[65],"(ML)":[66],"can":[67],"facilitate":[68],"of":[70,87,103,208,218,231],"a":[74,206],"manner":[75],"that":[76,96,219],"corresponds":[77],"LAM":[79,167,197],"best":[80],"practices.":[81],"We":[82],"use":[83],"StoryCorps":[85],"collection":[86],"oral":[88],"histories":[89],"\"Las":[90],"Historias,\"":[91],"fixed":[93],"subjects":[94],"(metadata)":[95],"are":[97,114,147],"manually":[98,233],"assigned":[99,234],"Our":[105],"methodology":[106],"has":[107,202],"two":[108,118],"main":[109],"phases.":[110],"First,":[111],"files":[113],"automatically":[115],"transcribed":[116],"using":[117,134,232],"automatic":[119],"speech":[120],"recognition":[121],"(ASR)":[122],"methods.":[123],"Next,":[124],"build":[126,237],"different":[127,212],"supervised":[128],"ML":[129,174],"models":[130],"for":[131,166,245],"label":[132,222],"prediction":[133,223],"transcription":[136,213],"data":[137],"existing":[140],"metadata.":[141],"Throughout":[142],"these":[143],"phases":[144],"results":[146],"analyzed":[148],"quantitatively":[149],"qualitatively.":[151],"The":[152,200,225],"is":[154],"implemented":[155],"within":[156],"flexible":[158],"web":[159],"framework":[160],"IDOLS":[161],"lower":[163],"technical":[164],"barriers":[165],"professionals.":[168],"By":[169],"allowing":[170],"users":[171,191],"submit":[173],"jobs":[175],"supercomputers,":[177],"reproduce":[178],"workflows,":[179],"change":[180],"configurations,":[181],"view":[183],"feedback":[186],"transparently,":[187],"allows":[190],"be":[193],"sync":[195],"professional":[198],"values.":[199],"study":[201,226],"several":[203],"outcomes":[204],"including":[205],"comparison":[207],"quality":[210,220],"between":[211],"methods":[214],"impact":[217],"on":[221],"accuracy.":[224],"also":[227],"unveiled":[228],"limitations":[230],"metadata":[235],"models,":[238],"which":[240],"suggest":[242],"alternate":[243],"strategies":[244],"building":[246],"successful":[247],"training":[248],"data.":[249]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3137678309","counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2024-12-29T14:40:16.728886","created_date":"2021-03-29"}