{"id":"https://openalex.org/W4388585336","doi":"https://doi.org/10.48550/arxiv.2311.04797","title":"CloverLeaf on Intel Multi-Core CPUs: A Case Study in Write-Allocate Evasion","display_name":"CloverLeaf on Intel Multi-Core CPUs: A Case Study in Write-Allocate Evasion","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4388585336","doi":"https://doi.org/10.48550/arxiv.2311.04797"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2311.04797","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2311.04797","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031307529","display_name":"Jan Laukemann","orcid":"https://orcid.org/0000-0002-3776-9353"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Laukemann, Jan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087470984","display_name":"Thomas Gruber","orcid":"https://orcid.org/0000-0001-6940-2065"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gruber, Thomas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082552227","display_name":"Georg Hager","orcid":"https://orcid.org/0000-0002-8723-2781"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hager, Georg","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043806886","display_name":"Dossay Oryspayev","orcid":"https://orcid.org/0000-0002-9319-6051"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oryspayev, Dossay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5070209050","display_name":"Gerhard Wellein","orcid":"https://orcid.org/0000-0001-7371-3026"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wellein, Gerhard","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":65},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9972,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.5914988},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.59043956},{"id":"https://openalex.org/keywords/stencil","display_name":"Stencil","score":0.5288081},{"id":"https://openalex.org/keywords/memory-model","display_name":"Memory model","score":0.41259995}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8456754},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6761976},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.5914988},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.59043956},{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.5288081},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.41259995},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.34786654},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.298075},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2311.04797","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.04797","pdf_url":"http://arxiv.org/pdf/2311.04797","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2311.04797","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2311.04797","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2981664121","https://openalex.org/W2936534257","https://openalex.org/W2898398754","https://openalex.org/W2773471004","https://openalex.org/W2749903484","https://openalex.org/W2526069705","https://openalex.org/W2269110805","https://openalex.org/W2214459866","https://openalex.org/W2035419609","https://openalex.org/W2024016913"],"abstract_inverted_index":{"In":[0],"this":[1,43,178],"paper":[2],"we":[3,45,69,131,164],"analyze":[4],"the":[5,9,13,36,54,72,113,136,152,173,189],"MPI-only":[6],"version":[7],"of":[8,38,53,144,154,188],"CloverLeaf":[10,114],"code":[11],"from":[12,172],"SPEChpc":[14],"2021":[15],"benchmark":[16],"suite":[17],"on":[18,121],"recent":[19],"Intel":[20,83],"Xeon":[21],"\"Ice":[22],"Lake\"":[23],"and":[24,61,94,128,201],"\"Sapphire":[25],"Rapids\"":[26],"server":[27],"CPUs.":[28,84],"We":[29,85,148,180],"observe":[30],"peculiar":[31],"breakdowns":[32,73],"in":[33,81,112,177],"performance":[34],"when":[35],"number":[37,153,191],"processes":[39,155],"is":[40,156],"prime.":[41],"Investigating":[42],"effect,":[44,192],"create":[46],"first-principles":[47],"data":[48,66,138],"traffic":[49,67],"models":[50],"for":[51,123],"each":[52],"stencil-like":[55],"hotspot":[56],"loops.":[57],"With":[58],"application":[59],"measurements":[60],"microbenchmarks":[62],"to":[63,74,98,134,160,167],"study":[64],"memory":[65,137],"behavior,":[68],"can":[70,118,165,181],"connect":[71],"SpecI2M,":[75],"a":[76,145],"new":[77],"write-allocate":[78,100],"evasion":[79,103],"feature":[80],"current":[82],"identify":[86],"conditions":[87],"under":[88],"which":[89,163],"SpecI2M":[90,158],"works":[91,104],"as":[92,194],"intended":[93],"where":[95],"it":[96],"fails":[97,159],"avoid":[99],"transfers.":[101],"Write-allocate":[102],"best":[105,124],"if":[106,151],"large":[107],"arrays":[108],"are":[109,132],"written":[110],"consecutively;":[111],"code,":[115],"non-temporal":[116],"stores":[117],"be":[119],"employed":[120],"top":[122],"results.":[125],"For":[126],"serial":[127],"full-node":[129],"cases":[130],"able":[133],"predict":[135],"volume":[139],"analytically":[140],"with":[141],"an":[142],"error":[143],"few":[146],"percent.":[147],"find":[149],"that":[150],"prime,":[157],"work":[161],"properly,":[162],"attribute":[166],"short":[168],"inner":[169],"loops":[170],"emerging":[171],"one-dimensional":[174],"domain":[175],"decomposition":[176],"case.":[179],"also":[182],"rule":[183],"out":[184],"other":[185],"possible":[186],"causes":[187],"prime":[190],"such":[193],"breaking":[195],"layer":[196],"conditions,":[197],"MPI":[198],"communication":[199],"overhead,":[200],"load":[202],"imbalance.":[203]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4388585336","counts_by_year":[],"updated_date":"2025-04-11T18:16:17.888862","created_date":"2023-11-11"}