{"id":"https://openalex.org/W4318541551","doi":"https://doi.org/10.1145/3575693.3575736","title":"DeepUM: Tensor Migration and Prefetching in Unified Memory","display_name":"DeepUM: Tensor Migration and Prefetching in Unified Memory","publication_year":2023,"publication_date":"2023-01-27","ids":{"openalex":"https://openalex.org/W4318541551","doi":"https://doi.org/10.1145/3575693.3575736"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3575693.3575736","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087873340","display_name":"Jaehoon Jung","orcid":"https://orcid.org/0000-0002-9562-6828"},"institutions":[],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaehoon Jung","raw_affiliation_strings":["Moreh, South Korea"],"affiliations":[{"raw_affiliation_string":"Moreh, South Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006733433","display_name":"Jin-Pyo Kim","orcid":"https://orcid.org/0000-0002-4370-1195"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"funder","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jinpyo Kim","raw_affiliation_strings":["Seoul National University, South Korea"],"affiliations":[{"raw_affiliation_string":"Seoul National University, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100767182","display_name":"Jaejin Lee","orcid":"https://orcid.org/0000-0003-4638-8170"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"funder","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaejin Lee","raw_affiliation_strings":["Seoul National University, South Korea"],"affiliations":[{"raw_affiliation_string":"Seoul National University, South Korea","institution_ids":["https://openalex.org/I139264467"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.004,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.99996,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9986,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.98,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.88747275},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.66147137},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.64522994},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6274636},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.5639873},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5000801},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.45881328},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3471417},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.21940774},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.100126445},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3575693.3575736","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.64,"id":"https://metadata.un.org/sdg/10"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":26,"referenced_works":["https://openalex.org/W2107354725","https://openalex.org/W2110815624","https://openalex.org/W2160395504","https://openalex.org/W2194775991","https://openalex.org/W2330958039","https://openalex.org/W2747329762","https://openalex.org/W2883283076","https://openalex.org/W2901994046","https://openalex.org/W2913059114","https://openalex.org/W2913640523","https://openalex.org/W2914304175","https://openalex.org/W2934021599","https://openalex.org/W2963341956","https://openalex.org/W2979340153","https://openalex.org/W2979826702","https://openalex.org/W2999615700","https://openalex.org/W3010830594","https://openalex.org/W3011293047","https://openalex.org/W3012479151","https://openalex.org/W3012514909","https://openalex.org/W3043443960","https://openalex.org/W3081168214","https://openalex.org/W3157864729","https://openalex.org/W4244348968","https://openalex.org/W4254589276","https://openalex.org/W4301361180"],"related_works":["https://openalex.org/W4312814274","https://openalex.org/W4285370786","https://openalex.org/W3207760230","https://openalex.org/W2536018345","https://openalex.org/W2358353312","https://openalex.org/W2353836703","https://openalex.org/W2296488620","https://openalex.org/W17155033","https://openalex.org/W1590307681","https://openalex.org/W1496222301"],"abstract_inverted_index":{"Deep":[0],"neural":[1],"networks":[2],"(DNNs)":[3],"are":[4],"continuing":[5],"to":[6,40,69,81,89,146],"get":[7],"wider":[8],"and":[9,22,79,110,113,137],"deeper.":[10],"As":[11],"a":[12,16,30,53,64],"result,":[13],"it":[14],"requires":[15],"tremendous":[17],"amount":[18],"of":[19,100],"GPU":[20,42,92,120,134],"memory":[21,43,50,121,135],"computing":[23],"power.":[24],"In":[25],"this":[26],"paper,":[27],"we":[28],"propose":[29,85],"framework":[31],"called":[32],"DeepUM":[33,62,101,129],"that":[34,128,142],"exploits":[35],"CUDA":[36],"Unified":[37],"Memory":[38],"(UM)":[39],"allow":[41],"oversubscription":[44,51,136],"for":[45,133],"DNNs.":[46],"While":[47],"UM":[48],"allows":[49],"using":[52,102],"page":[54,57,72],"fault":[55,93],"mechanism,":[56],"migration":[58,73],"introduces":[59],"enormous":[60],"overhead.":[61,74],"uses":[63],"new":[65],"correlation":[66],"prefetching":[67],"technique":[68],"hide":[70],"the":[71,91,98],"It":[75],"is":[76,130],"fully":[77],"automatic":[78],"transparent":[80],"users.":[82],"We":[83,96],"also":[84],"two":[86],"optimization":[87],"techniques":[88],"minimize":[90],"handling":[94],"time.":[95],"evaluate":[97],"performance":[99,116],"nine":[103],"large-scale":[104],"DNNs":[105],"from":[106],"MLPerf,":[107],"PyTorch":[108],"examples,":[109],"Hugging":[111],"Face":[112],"compare":[114],"its":[115],"with":[117],"six":[118],"state-of-the-art":[119],"swapping":[122],"approaches.":[123],"The":[124],"evaluation":[125],"result":[126],"indicates":[127],"very":[131],"effective":[132],"can":[138],"handle":[139],"larger":[140],"models":[141],"other":[143],"approaches":[144],"fail":[145],"handle.":[147]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4318541551","counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3}],"updated_date":"2025-04-16T09:23:32.649126","created_date":"2023-01-31"}