{"id":"https://openalex.org/W2906880415","doi":"https://doi.org/10.1109/cahpc.2018.8645880","title":"Hybrid MPI+openMP Implementation of eXtended Discrete Element Method","display_name":"Hybrid MPI+openMP Implementation of eXtended Discrete Element Method","publication_year":2018,"publication_date":"2018-09-01","ids":{"openalex":"https://openalex.org/W2906880415","doi":"https://doi.org/10.1109/cahpc.2018.8645880","mag":"2906880415"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cahpc.2018.8645880","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064236947","display_name":"Abdoul Wahid Mainassara Checkaraou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdoul Wahid Mainassara Checkaraou","raw_affiliation_strings":["Computational Engineering Department, LuXDEM Research Centre"],"affiliations":[{"raw_affiliation_string":"Computational Engineering Department, LuXDEM Research Centre","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082459013","display_name":"Alban Rousset","orcid":"https://orcid.org/0000-0002-9727-5638"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alban Rousset","raw_affiliation_strings":["Computational Engineering Department, LuXDEM Research Centre"],"affiliations":[{"raw_affiliation_string":"Computational Engineering Department, LuXDEM Research Centre","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050229692","display_name":"Xavier Besseron","orcid":"https://orcid.org/0000-0002-7783-2185"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xavier Besseron","raw_affiliation_strings":["Computational Engineering Department, LuXDEM Research Centre"],"affiliations":[{"raw_affiliation_string":"Computational Engineering Department, LuXDEM Research Centre","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020868628","display_name":"S\u00e9bastien Varrette","orcid":"https://orcid.org/0000-0001-9011-851X"},"institutions":[{"id":"https://openalex.org/I186903577","display_name":"University of Luxembourg","ror":"https://ror.org/036x5ad56","country_code":"LU","type":"education","lineage":["https://openalex.org/I186903577"]}],"countries":["LU"],"is_corresponding":false,"raw_author_name":"Sebastien Varrette","raw_affiliation_strings":["PCOG, University of Luxembourg, Luxembourg"],"affiliations":[{"raw_affiliation_string":"PCOG, University of Luxembourg, Luxembourg","institution_ids":["https://openalex.org/I186903577"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066477908","display_name":"Bernhard Peters","orcid":"https://orcid.org/0000-0002-7260-3623"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bernhard Peters","raw_affiliation_strings":["Computational Engineering Department, LuXDEM Research Centre"],"affiliations":[{"raw_affiliation_string":"Computational Engineering Department, LuXDEM Research Centre","institution_ids":[]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.696,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":6,"citation_normalized_percentile":{"value":0.840057,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":80,"max":82},"biblio":{"volume":null,"issue":null,"first_page":"450","last_page":"457"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10615","display_name":"Granular flow and fluidized beds","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10615","display_name":"Granular flow and fluidized beds","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11694","display_name":"Fluid Dynamics Simulations and Interactions","score":0.9976,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11751","display_name":"Lattice Boltzmann Simulation Studies","score":0.9914,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4725057}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79834986},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6544875},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6177696},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.56242293},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.54186934},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.5128529},{"id":"https://openalex.org/C171872576","wikidata":"https://www.wikidata.org/wiki/Q902783","display_name":"Discrete element method","level":2,"score":0.5030348},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4725057},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.47088084},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46124333},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17870662},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C57879066","wikidata":"https://www.wikidata.org/wiki/Q41217","display_name":"Mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cahpc.2018.8645880","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.62}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":21,"referenced_works":["https://openalex.org/W1556859836","https://openalex.org/W1589759203","https://openalex.org/W1983096721","https://openalex.org/W1990297162","https://openalex.org/W2011454852","https://openalex.org/W2015767328","https://openalex.org/W2021544026","https://openalex.org/W2028891745","https://openalex.org/W2041902442","https://openalex.org/W2073775990","https://openalex.org/W2182769868","https://openalex.org/W2277172374","https://openalex.org/W232758418","https://openalex.org/W2403972023","https://openalex.org/W2724109030","https://openalex.org/W2755101877","https://openalex.org/W2766769588","https://openalex.org/W2995037337","https://openalex.org/W31923072","https://openalex.org/W4292169167","https://openalex.org/W59481368"],"related_works":["https://openalex.org/W3214280620","https://openalex.org/W3191490922","https://openalex.org/W2794038527","https://openalex.org/W2765823764","https://openalex.org/W2384867379","https://openalex.org/W2329539859","https://openalex.org/W2227905990","https://openalex.org/W1996803181","https://openalex.org/W1972257371","https://openalex.org/W1582436825"],"abstract_inverted_index":{"The":[0],"Extended":[1],"Discrete":[2,17],"Element":[3,18],"Method":[4,19],"(XDEM)":[5],"is":[6,133,232],"a":[7,74,101,113,131,198,209,233,253,287,321,342],"novel":[8],"and":[9,76,82,88,125,186,213,264,292,301,316,346],"innovative":[10],"numerical":[11],"simulation":[12,69,255],"technique":[13],"that":[14],"extends":[15],"classical":[16],"(DEM)":[20],"(which":[21,188],"simulates":[22],"the":[23,33,51,95,98,104,118,158,182,193,203,250,273,279,294,310,318,326,330,354],"motion":[24],"of":[25,53,100,106,123,151,160,168,200,206,272,282,296,302,312,329,332,356,361,363],"granular":[26,54],"material),":[27],"by":[28,191],"additional":[29],"properties":[30],"such":[31,56,130,285],"as":[32,57,286],"chemical":[34],"composition,":[35],"thermodynamic":[36],"state,":[37],"stress/strain":[38],"for":[39,80,227,237],"each":[40,313],"particle.":[41],"It":[42],"has":[43,72],"been":[44],"applied":[45],"successfully":[46],"to":[47,85,116,163,218],"numerous":[48],"industries":[49],"involving":[50],"processing":[52],"materials":[55],"sand,":[58],"rock,":[59],"wood":[60],"or":[61,97,146],"coke":[62],"[16],":[63],"[17].":[64],"In":[65,128,153],"this":[66,154,276],"context,":[67],"computational":[68],"with":[70,178,197,341],"(X)DEM":[71],"become":[73],"more":[75,77,238],"essential":[78],"tool":[79],"researchers":[81],"scientific":[83],"engineers":[84],"set":[86,199],"up":[87],"explore":[89],"their":[90],"experimental":[91],"processes.":[92],"However,":[93],"increasing":[94,353],"size":[96],"accuracy":[99,245],"model":[102],"requires":[103],"use":[105],"High":[107],"Performance":[108],"Computing":[109],"(HPC)":[110],"platforms":[111],"over":[112],"parallelized":[114,177],"implementation":[115,319],"accommodate":[117],"growing":[119],"needs":[120],"in":[121,216,252],"terms":[122],"memory":[124,140,144,299],"computation":[126,195],"time.":[127],"practice,":[129],"parallelization":[132,205],"traditionally":[134],"obtained":[135],"using":[136,320],"either":[137],"MPI":[138,366],"(distributed":[139],"computing),":[141],"openMP":[142,166,184,201,204],"(shared":[143],"computing)":[145],"hybrid":[147,171],"approaches":[148],"combining":[149],"both":[150],"them.":[152],"paper,":[155],"we":[156,335],"present":[157,336],"results":[159,308,340],"our":[161,337],"effort":[162],"implement":[164],"an":[165],"version":[167],"XDEM":[169,207,231],"allowing":[170],"MPI+openMP":[172,339],"simulations":[173],"(XDEM":[174],"being":[175],"already":[176],"MPI).":[179],"Far":[180],"from":[181],"basic":[183],"paradigm":[185],"recommendations":[187],"simply":[189],"summarizes":[190],"decorating":[192],"main":[194,225],"loops":[196],"pragma),":[202],"required":[208],"fundamental":[210],"code":[211,235],"re-factoring":[212],"careful":[214],"tuning":[215],"order":[217],"reach":[219],"good":[220],"performance.":[221,248],"There":[222],"are":[223,256],"two":[224],"reasons":[226],"those":[228],"difficulties.":[229],"Firstly,":[230],"legacy":[234],"developed":[236],"than":[239,247],"10":[240],"years,":[241],"initially":[242],"focused":[243],"on":[244,325],"rather":[246],"Secondly,":[249],"particles":[251],"DEM":[254],"highly":[257],"dynamic:":[258],"they":[259],"can":[260,267],"be":[261],"added,":[262],"deleted":[263],"interaction":[265],"relations":[266],"change":[268],"at":[269],"any":[270],"timestep":[271],"simulation.":[274],"Thus":[275],"article":[277],"details":[278],"multiple":[280],"layers":[281],"optimization":[283,314],"applied,":[284],"deep":[288],"data":[289],"structure":[290],"profiling":[291],"reorganization,":[293],"usage":[295],"fast":[297],"multithreaded":[298],"allocators":[300],"advanced":[303],"process/thread-to-core":[304],"pinning":[305],"techniques.":[306],"Experimental":[307],"evaluate":[309],"benefit":[311],"individually":[315],"validate":[317],"real-world":[322],"application":[323],"executed":[324],"HPC":[327],"platform":[328],"University":[331],"Luxembourg.":[333],"Finally,":[334],"Hybrid":[338],"15%-20%":[343],"performance":[344],"gain":[345],"how":[347],"it":[348],"overcomes":[349],"scalability":[350],"limits":[351],"(by":[352],"number":[355],"compute":[357],"cores":[358],"without":[359],"dropping":[360],"performances)":[362],"XDEM-based":[364],"pure":[365],"simulations.":[367]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2906880415","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1}],"updated_date":"2025-01-09T05:34:57.968741","created_date":"2019-01-11"}