{"id":"https://openalex.org/W4399282167","doi":"https://doi.org/10.1145/3650200.3656636","title":"gZCCL: Compression-Accelerated Collective Communication Framework for GPU Clusters","display_name":"gZCCL: Compression-Accelerated Collective Communication Framework for GPU Clusters","publication_year":2024,"publication_date":"2024-05-30","ids":{"openalex":"https://openalex.org/W4399282167","doi":"https://doi.org/10.1145/3650200.3656636"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3650200.3656636","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656636","source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656636","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100779661","display_name":"Jiajun Huang","orcid":"https://orcid.org/0000-0001-5092-3987"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiajun Huang","raw_affiliation_strings":["University of California, Riverside, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103124363","display_name":"Sheng Di","orcid":null},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sheng Di","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052001478","display_name":"Xiaodong Yu","orcid":"https://orcid.org/0000-0001-6244-1264"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"funder","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaodong Yu","raw_affiliation_strings":["Stevens Institute of Technology, USA"],"affiliations":[{"raw_affiliation_string":"Stevens Institute of Technology, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035339023","display_name":"Yujia Zhai","orcid":"https://orcid.org/0000-0002-2688-8058"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yujia Zhai","raw_affiliation_strings":["University of California, Riverside, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100705519","display_name":"Jinyang Liu","orcid":"https://orcid.org/0000-0003-0177-502X"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jinyang Liu","raw_affiliation_strings":["University of California, Riverside, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074539156","display_name":"Yafan Huang","orcid":"https://orcid.org/0000-0001-7370-6766"},"institutions":[{"id":"https://openalex.org/I126307644","display_name":"University of Iowa","ror":"https://ror.org/036jqmy94","country_code":"US","type":"funder","lineage":["https://openalex.org/I126307644"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yafan Huang","raw_affiliation_strings":["University of Iowa, USA"],"affiliations":[{"raw_affiliation_string":"University of Iowa, USA","institution_ids":["https://openalex.org/I126307644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059814688","display_name":"Ken Raffenetti","orcid":"https://orcid.org/0009-0003-4705-2713"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ken Raffenetti","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100656658","display_name":"Hui Zhou","orcid":"https://orcid.org/0000-0002-4422-2911"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hui Zhou","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100643410","display_name":"Kai Zhao","orcid":"https://orcid.org/0000-0001-5328-3962"},"institutions":[{"id":"https://openalex.org/I103163165","display_name":"Florida State University","ror":"https://ror.org/05g3dte14","country_code":"US","type":"funder","lineage":["https://openalex.org/I103163165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kai Zhao","raw_affiliation_strings":["Florida State University, USA"],"affiliations":[{"raw_affiliation_string":"Florida State University, USA","institution_ids":["https://openalex.org/I103163165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067748041","display_name":"Xiaoyi Lu","orcid":"https://orcid.org/0000-0001-7581-8905"},"institutions":[{"id":"https://openalex.org/I156087764","display_name":"University of California, Merced","ror":"https://ror.org/00d9ah105","country_code":"US","type":"funder","lineage":["https://openalex.org/I156087764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoyi Lu","raw_affiliation_strings":["University of California, Merced, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Merced, USA","institution_ids":["https://openalex.org/I156087764"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061737717","display_name":"Zizhong Chen","orcid":"https://orcid.org/0000-0003-2578-4940"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zizhong Chen","raw_affiliation_strings":["University of California, Riverside, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046613458","display_name":"Franck Cappello","orcid":"https://orcid.org/0000-0002-7890-3934"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Franck Cappello","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024620270","display_name":"Yanfei Guo","orcid":"https://orcid.org/0000-0002-3731-5423"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanfei Guo","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014920685","display_name":"Rajeev Thakur","orcid":"https://orcid.org/0000-0002-5532-3048"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rajeev Thakur","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.156,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.795159,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":null,"issue":null,"first_page":"437","last_page":"448"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9937,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9926,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.7906641}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.87306297},{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.7906641},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7886366},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5184807},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.45203155},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.42850965},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.38617826},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3627807},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.17156526},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1611759},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.12969965},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.12442407},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.09676501}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3650200.3656636","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656636","source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2308.05199","pdf_url":"https://arxiv.org/pdf/2308.05199","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3650200.3656636","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656636","source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":24,"referenced_works":["https://openalex.org/W2052440657","https://openalex.org/W2057332538","https://openalex.org/W2064675550","https://openalex.org/W2131613942","https://openalex.org/W2164945803","https://openalex.org/W2313344362","https://openalex.org/W2486202470","https://openalex.org/W2580688187","https://openalex.org/W2625759119","https://openalex.org/W2992612536","https://openalex.org/W2997749524","https://openalex.org/W3007005426","https://openalex.org/W3032789239","https://openalex.org/W3037979316","https://openalex.org/W3129251660","https://openalex.org/W3177445289","https://openalex.org/W3196392241","https://openalex.org/W4238128135","https://openalex.org/W4285105236","https://openalex.org/W4367147749","https://openalex.org/W4384705453","https://openalex.org/W4388105305","https://openalex.org/W4391093839","https://openalex.org/W4393183862"],"related_works":["https://openalex.org/W4384342390","https://openalex.org/W4247601675","https://openalex.org/W3180760233","https://openalex.org/W3035703949","https://openalex.org/W2888954728","https://openalex.org/W2552401318","https://openalex.org/W2547124190","https://openalex.org/W2385628723","https://openalex.org/W108076602","https://openalex.org/W1033938421"],"abstract_inverted_index":{"GPU-aware":[0,28],"collective":[1,106,110],"communication":[2],"has":[3],"become":[4],"a":[5,58],"major":[6],"bottleneck":[7],"for":[8],"modern":[9],"computing":[10,14],"platforms":[11],"as":[12,38,117,119],"GPU":[13,40],"power":[15],"rapidly":[16],"rises.":[17],"A":[18],"traditional":[19],"approach":[20],"is":[21],"to":[22,33,48,73,87,124],"directly":[23],"integrate":[24],"lossy":[25],"compression":[26],"into":[27],"collectives,":[29,103],"which":[30],"can":[31,114],"lead":[32],"serious":[34],"performance":[35,84],"issues":[36],"such":[37],"underutilized":[39],"devices":[41],"and":[42,64,95,109,127],"uncontrolled":[43],"data":[44,111,143],"distortion.":[45],"In":[46],"order":[47],"address":[49],"these":[50],"issues,":[51],"in":[52],"this":[53],"paper,":[54],"we":[55,81],"propose":[56],"gZCCL,":[57],"first-ever":[59],"general":[60],"framework":[61],"that":[62,100],"designs":[63],"optimizes":[65],"GPU-aware,":[66],"compression-enabled":[67],"collectives":[68],"with":[69,92,135],"an":[70,136],"accuracy-aware":[71,147],"design":[72],"control":[74],"error":[75],"propagation.":[76],"To":[77],"validate":[78],"our":[79,101,132,146],"framework,":[80],"evaluate":[82],"the":[83,140],"on":[85],"up":[86,123],"512":[88],"NVIDIA":[89],"A100":[90],"GPUs":[91],"real-world":[93],"applications":[94],"datasets.":[96],"Experimental":[97],"results":[98],"demonstrate":[99],"gZCCL-accelerated":[102],"including":[104],"both":[105],"computation":[107],"(Allreduce)":[108],"movement":[112],"(Scatter),":[113],"outperform":[115],"NCCL":[116],"well":[118],"Cray":[120],"MPI":[121],"by":[122],"4.5":[125],"\u00d7":[126],"28.7":[128],"\u00d7,":[129],"respectively.":[130],"Furthermore,":[131],"accuracy":[133],"evaluation":[134],"image-stacking":[137],"application":[138],"confirms":[139],"high":[141],"reconstructed":[142],"quality":[144],"of":[145],"framework.":[148]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4399282167","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-03-23T00:45:07.420051","created_date":"2024-06-04"}