{"id":"https://openalex.org/W4377130684","doi":"https://doi.org/10.1145/3588195.3595955","title":"Accelerating MPI Collectives with Process-in-Process-based Multi-object Techniques","display_name":"Accelerating MPI Collectives with Process-in-Process-based Multi-object Techniques","publication_year":2023,"publication_date":"2023-08-07","ids":{"openalex":"https://openalex.org/W4377130684","doi":"https://doi.org/10.1145/3588195.3595955"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3588195.3595955","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"preprint","type_crossref":"proceedings-article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.1145/3588195.3595955","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100779661","display_name":"Jiajun Huang","orcid":"https://orcid.org/0000-0001-5092-3987"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiajun Huang","raw_affiliation_strings":["University of California, Riverside, Riverside, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, Riverside, CA, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051694932","display_name":"Kaiming Ouyang","orcid":"https://orcid.org/0000-0002-4775-1835"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"funder","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kaiming Ouyang","raw_affiliation_strings":["NVIDIA Corporation, Santa Clara, CA, USA"],"affiliations":[{"raw_affiliation_string":"NVIDIA Corporation, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035339023","display_name":"Yujia Zhai","orcid":"https://orcid.org/0000-0002-2688-8058"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yujia Zhai","raw_affiliation_strings":["University of California, Riverside, Riverside, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, Riverside, CA, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100705519","display_name":"Jinyang Liu","orcid":"https://orcid.org/0000-0003-0177-502X"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jinyang Liu","raw_affiliation_strings":["University of California, Riverside, Riverside, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, Riverside, CA, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058015880","display_name":"Min Si","orcid":"https://orcid.org/0000-0002-0208-096X"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"funder","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Min Si","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059814688","display_name":"Ken Raffenetti","orcid":"https://orcid.org/0009-0003-4705-2713"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ken Raffenetti","raw_affiliation_strings":["Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100656658","display_name":"Hui Zhou","orcid":"https://orcid.org/0000-0002-4422-2911"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hui Zhou","raw_affiliation_strings":["Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102836031","display_name":"Atsushi Hori","orcid":"https://orcid.org/0000-0002-7010-8098"},"institutions":[{"id":"https://openalex.org/I184597095","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47","country_code":"JP","type":"funder","lineage":["https://openalex.org/I1319490839","https://openalex.org/I184597095","https://openalex.org/I4210158934"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Atsushi Hori","raw_affiliation_strings":["National Institute of Informatics, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"National Institute of Informatics, Tokyo, Japan","institution_ids":["https://openalex.org/I184597095"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061737717","display_name":"Zizhong Chen","orcid":"https://orcid.org/0000-0003-2578-4940"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"funder","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zizhong Chen","raw_affiliation_strings":["University of California, Riverside, Riverside, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Riverside, Riverside, CA, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024620270","display_name":"Yanfei Guo","orcid":"https://orcid.org/0000-0002-3731-5423"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanfei Guo","raw_affiliation_strings":["Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014920685","display_name":"Rajeev Thakur","orcid":"https://orcid.org/0000-0002-5532-3048"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"funder","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rajeev Thakur","raw_affiliation_strings":["Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":2,"citation_normalized_percentile":{"value":0.958133,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":77,"max":82},"biblio":{"volume":null,"issue":null,"first_page":"333","last_page":"334"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9974,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9974,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9966,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9966,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/message-passing-interface","display_name":"Message Passing Interface","score":0.4731532},{"id":"https://openalex.org/keywords/communication-source","display_name":"Communication source","score":0.4628422}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.90131855},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7364683},{"id":"https://openalex.org/C854659","wikidata":"https://www.wikidata.org/wiki/Q1859284","display_name":"Message passing","level":2,"score":0.5841834},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5736047},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.51735944},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.4981556},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.49129862},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4882908},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.48821905},{"id":"https://openalex.org/C166782233","wikidata":"https://www.wikidata.org/wiki/Q127879","display_name":"Message Passing Interface","level":3,"score":0.4731532},{"id":"https://openalex.org/C198104137","wikidata":"https://www.wikidata.org/wiki/Q974688","display_name":"Communication source","level":2,"score":0.4628422},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.44720826},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4449901},{"id":"https://openalex.org/C130795937","wikidata":"https://www.wikidata.org/wiki/Q2561570","display_name":"Remote direct memory access","level":2,"score":0.41686782},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2515272},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.23821032},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3588195.3595955","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2305.10612","pdf_url":"https://arxiv.org/pdf/2305.10612","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2305.10612","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3588195.3595955","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":["https://openalex.org/W4377130684"],"referenced_works_count":3,"referenced_works":["https://openalex.org/W2058694702","https://openalex.org/W2808584769","https://openalex.org/W2886520239"],"related_works":["https://openalex.org/W4386915331","https://openalex.org/W2751263050","https://openalex.org/W2378910916","https://openalex.org/W2361929291","https://openalex.org/W2124048060","https://openalex.org/W2116006827","https://openalex.org/W2099148634","https://openalex.org/W2086666199","https://openalex.org/W1902983110","https://openalex.org/W1511717675"],"abstract_inverted_index":{"In":[0],"the":[1],"exascale":[2],"computing":[3,11],"era,":[4],"optimizing":[5],"MPI":[6,48,55,118,131],"collective":[7,56,67],"performance":[8,19,57,99],"in":[9,104],"high-performance":[10],"(HPC)":[12],"applications":[13],"is":[14],"critical.":[15],"Current":[16],"algorithms":[17,68],"face":[18],"degradation":[20],"due":[21],"to":[22,75,128],"system":[23,78],"call":[24],"overhead,":[25,82],"page":[26,80],"faults,":[27],"or":[28],"data-copy":[29],"latency,":[30],"affecting":[31],"HPC":[32],"applications'":[33],"efficiency":[34],"and":[35,65,69,83,89,93,123,135],"scalability.":[36],"To":[37],"address":[38],"these":[39],"issues,":[40],"we":[41],"propose":[42],"PiP-MColl,":[43],"a":[44],"Process-in-Process-based":[45],"Multi-object":[46],"Inter-process":[47],"Collective":[49],"design":[50,96],"that":[51,114],"maximizes":[52],"small":[53],"message":[54,91,109],"at":[58],"scale.":[59],"PiP-MColl":[60,115],"features":[61],"efficient":[62],"multiple":[63],"sender":[64],"receiver":[66],"leverages":[70],"Process-in-Process":[71],"shared":[72],"memory":[73],"techniques":[74],"eliminate":[76],"unnecessary":[77],"call,":[79],"fault":[81],"extra":[84],"data":[85],"copy,":[86],"improving":[87],"intra-":[88],"inter-node":[90],"rate":[92],"throughput.":[94],"Our":[95],"also":[97],"boosts":[98],"for":[100,107,130],"larger":[101],"messages,":[102],"resulting":[103],"comprehensive":[105],"improvement":[106],"various":[108],"sizes.":[110],"Experimental":[111],"results":[112],"show":[113],"outperforms":[116],"popular":[117],"libraries,":[119],"including":[120],"OpenMPI,":[121],"MVAPICH2,":[122],"Intel":[124],"MPI,":[125],"by":[126],"up":[127],"4.6X":[129],"collectives":[132],"like":[133],"MPI_Scatter":[134],"MPI_Allgather.":[136]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4377130684","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-03-19T18:59:59.350611","created_date":"2023-05-21"}