{"id":"https://openalex.org/W4390748391","doi":"https://doi.org/10.1007/s42514-023-00159-7","title":"swCUDA: Auto parallel code translation framework from CUDA to ATHREAD for new generation sunway supercomputer","display_name":"swCUDA: Auto parallel code translation framework from CUDA to ATHREAD for new generation sunway supercomputer","publication_year":2024,"publication_date":"2024-01-11","ids":{"openalex":"https://openalex.org/W4390748391","doi":"https://doi.org/10.1007/s42514-023-00159-7"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1007/s42514-023-00159-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s42514-023-00159-7.pdf","source":{"id":"https://openalex.org/S4210190911","display_name":"CCF Transactions on High Performance Computing","issn_l":"2524-4922","issn":["2524-4922","2524-4930"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310319900"],"host_organization_lineage_names":["Springer Nature","Springer Science+Business Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s42514-023-00159-7.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101290671","display_name":"Maoxue Yu","orcid":"https://orcid.org/0000-0002-7253-4947"},"institutions":[{"id":"https://openalex.org/I4210161003","display_name":"Qingdao Center of Resource Chemistry and New Materials","ror":"https://ror.org/05x85k702","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210089297","https://openalex.org/I4210161003"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Maoxue Yu","raw_affiliation_strings":["Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China","institution_ids":["https://openalex.org/I4210161003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109673172","display_name":"Guanghao Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I4210161003","display_name":"Qingdao Center of Resource Chemistry and New Materials","ror":"https://ror.org/05x85k702","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210089297","https://openalex.org/I4210161003"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanghao Ma","raw_affiliation_strings":["Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China","institution_ids":["https://openalex.org/I4210161003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022323692","display_name":"Zhuoya Wang","orcid":"https://orcid.org/0000-0001-8883-3979"},"institutions":[{"id":"https://openalex.org/I4210161003","display_name":"Qingdao Center of Resource Chemistry and New Materials","ror":"https://ror.org/05x85k702","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210089297","https://openalex.org/I4210161003"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuoya Wang","raw_affiliation_strings":["Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China","institution_ids":["https://openalex.org/I4210161003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024486204","display_name":"Shuai Tang","orcid":"https://orcid.org/0000-0003-2822-5060"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Tang","raw_affiliation_strings":["Computer Science, Ocean University of China, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Computer Science, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057511134","display_name":"Yuhu Chen","orcid":"https://orcid.org/0000-0002-0228-3126"},"institutions":[{"id":"https://openalex.org/I4210161003","display_name":"Qingdao Center of Resource Chemistry and New Materials","ror":"https://ror.org/05x85k702","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210089297","https://openalex.org/I4210161003"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhu Chen","raw_affiliation_strings":["Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China","institution_ids":["https://openalex.org/I4210161003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077687075","display_name":"Kwang\u2010Ting Cheng","orcid":"https://orcid.org/0000-0002-3885-4912"},"institutions":[{"id":"https://openalex.org/I4210161003","display_name":"Qingdao Center of Resource Chemistry and New Materials","ror":"https://ror.org/05x85k702","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210089297","https://openalex.org/I4210161003"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yucheng Wang","raw_affiliation_strings":["Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China","institution_ids":["https://openalex.org/I4210161003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100405051","display_name":"Yuanyuan Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210161003","display_name":"Qingdao Center of Resource Chemistry and New Materials","ror":"https://ror.org/05x85k702","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210089297","https://openalex.org/I4210161003"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanyuan Liu","raw_affiliation_strings":["Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Network and Information Center, Qingdao Marine Science and Technology Center, Qingdao, China","institution_ids":["https://openalex.org/I4210161003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007001305","display_name":"Dongning Jia","orcid":"https://orcid.org/0000-0001-5805-4931"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongning Jia","raw_affiliation_strings":["Computer Science, Ocean University of China, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Computer Science, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079932099","display_name":"Zhiqiang Wei","orcid":"https://orcid.org/0000-0002-2830-8301"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqiang Wei","raw_affiliation_strings":["Computer Science, Ocean University of China, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Computer Science, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":2190,"currency":"EUR","value_usd":2790,"provenance":"doaj"},"apc_paid":{"value":2190,"currency":"EUR","value_usd":2790,"provenance":"doaj"},"fwci":0.0,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":"6","issue":"4","first_page":"439","last_page":"458"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9975,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9956,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7911701}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8562726},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8355377},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7911701},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.7047988},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.52952856},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.46025762},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1691032}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1007/s42514-023-00159-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s42514-023-00159-7.pdf","source":{"id":"https://openalex.org/S4210190911","display_name":"CCF Transactions on High Performance Computing","issn_l":"2524-4922","issn":["2524-4922","2524-4930"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310319900"],"host_organization_lineage_names":["Springer Nature","Springer Science+Business Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1007/s42514-023-00159-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s42514-023-00159-7.pdf","source":{"id":"https://openalex.org/S4210190911","display_name":"CCF Transactions on High Performance Computing","issn_l":"2524-4922","issn":["2524-4922","2524-4930"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310319900"],"host_organization_lineage_names":["Springer Nature","Springer Science+Business Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China","award_id":"2021YFF0704000"}],"datasets":[],"versions":[],"referenced_works_count":27,"referenced_works":["https://openalex.org/W1966078827","https://openalex.org/W1994778680","https://openalex.org/W2016888570","https://openalex.org/W2016939324","https://openalex.org/W2026448279","https://openalex.org/W2031781358","https://openalex.org/W2035687084","https://openalex.org/W2072750798","https://openalex.org/W2075745057","https://openalex.org/W2123090765","https://openalex.org/W2128120785","https://openalex.org/W2475126267","https://openalex.org/W2582572759","https://openalex.org/W2619305731","https://openalex.org/W2744007529","https://openalex.org/W2902659137","https://openalex.org/W2987526375","https://openalex.org/W3003835559","https://openalex.org/W3094076646","https://openalex.org/W3126566516","https://openalex.org/W3168039489","https://openalex.org/W3190460377","https://openalex.org/W3208078891","https://openalex.org/W3208977565","https://openalex.org/W3210190478","https://openalex.org/W4306796079","https://openalex.org/W645173616"],"related_works":["https://openalex.org/W947442053","https://openalex.org/W4313433561","https://openalex.org/W4249323025","https://openalex.org/W2983282793","https://openalex.org/W2778498407","https://openalex.org/W2317245370","https://openalex.org/W2148915962","https://openalex.org/W2030310580","https://openalex.org/W198851386","https://openalex.org/W1980160788"],"abstract_inverted_index":{"Abstract":[0],"Since":[1],"specific":[2],"hardware":[3],"characteristics":[4],"and":[5,15,68,77,106,130,155],"low-level":[6],"programming":[7],"model":[8],"are":[9,29],"adapted":[10],"to":[11,25,56,61,72,86,102,152,167,182],"both":[12],"NVIDIA":[13,161],"GPU":[14],"new":[16],"generation":[17],"Sunway":[18,26,62,145],"architecture,":[19,146],"automatically":[20],"translating":[21],"mature":[22],"CUDA":[23,58,104],"kernels":[24,28,170],"ATHREAD":[27],"realistic":[30],"but":[31],"challenging":[32],"work.":[33],"To":[34,48],"address":[35],"this":[36],"issue,":[37],"swCUDA":[38,94,164],",":[39],"an":[40,136],"auto":[41],"parallel":[42],"code":[43,96],"translation":[44,55,122],"framework":[45],"is":[46,123,165],"proposed.":[47],"that":[49],"end,":[50],"we":[51],"create":[52],"scale":[53],"affine":[54],"transform":[57],"thread":[59],"hierarchy":[60,67],"index,":[63],"directive":[64,81],"based":[65,82],"memory":[66,75],"data":[69,78],"redirection":[70],"optimization":[71],"assign":[73],"optimal":[74],"usage":[76],"stride":[79],"strategy,":[80],"grouping-calculation-asynchronous-reduction":[83],"(GCAR)":[84],"algorithm":[85],"provide":[87],"general":[88],"solution":[89],"for":[90],"random":[91],"access":[92],"issue.":[93],"utilizes":[95],"generator":[97],"ANTLR":[98],"as":[99],"compiler":[100],"frontend":[101],"parse":[103],"kernel":[105],"integrate":[107],"novel":[108],"algorithms":[109],"in":[110],"the":[111,126,144,172],"node":[112],"of":[113,149,171],"abstracted":[114],"syntax":[115],"tree":[116],"(AST)":[117],"depending":[118],"on":[119,125,143],"directives.":[120],"Automatically":[121],"performed":[124],"entire":[127],"Polybench":[128],"suite":[129],"NBody":[131],"simulation":[132],"benchmark.":[133],"We":[134],"get":[135],"average":[137,147,156],"40x":[138],"speedup":[139,148],"compared":[140,151],"with":[141],"baseline":[142],"15x":[150],"x86":[153],"CPU":[154],"27":[157],"percentage":[158],"higher":[159],"than":[160],"GPU.":[162],"Further,":[163],"implemented":[166],"translate":[168],"major":[169],"real":[173],"world":[174],"application":[175],"Gromacs.":[176],"The":[177],"translated":[178],"version":[179],"achieves":[180],"up":[181],"17x":[183],"speedup.":[184]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4390748391","counts_by_year":[],"updated_date":"2024-12-24T02:59:20.620166","created_date":"2024-01-13"}