{"id":"https://openalex.org/W1895923153","doi":"https://doi.org/10.1109/ipdps.2000.846065","title":"Load balancing strategies for dense linear algebra kernels on heterogeneous two-dimensional grids","display_name":"Load balancing strategies for dense linear algebra kernels on heterogeneous two-dimensional grids","publication_year":2002,"publication_date":"2002-11-07","ids":{"openalex":"https://openalex.org/W1895923153","doi":"https://doi.org/10.1109/ipdps.2000.846065","mag":"1895923153"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2000.846065","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064515122","display_name":"Olivier Beaumont","orcid":"https://orcid.org/0000-0003-2741-6228"},"institutions":[{"id":"https://openalex.org/I113428412","display_name":"\u00c9cole Normale Sup\u00e9rieure de Lyon","ror":"https://ror.org/04zmssz18","country_code":"FR","type":"education","lineage":["https://openalex.org/I113428412","https://openalex.org/I203339264"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"O. Beaumont","raw_affiliation_strings":["Ecole normale superieure de Lyon FRANCE"],"affiliations":[{"raw_affiliation_string":"Ecole normale superieure de Lyon FRANCE","institution_ids":["https://openalex.org/I113428412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111973497","display_name":"Vincent Boudet","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"V. Boudet","raw_affiliation_strings":["Regularity and massive parallel computing"],"affiliations":[{"raw_affiliation_string":"Regularity and massive parallel computing","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089282120","display_name":"Fabrice Rastello","orcid":"https://orcid.org/0000-0002-6589-9956"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"F. Rastello","raw_affiliation_strings":["Regularity and massive parallel computing"],"affiliations":[{"raw_affiliation_string":"Regularity and massive parallel computing","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001838181","display_name":"Yves Robert","orcid":"https://orcid.org/0000-0003-2361-055X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Y. Robert","raw_affiliation_strings":["Regularity and massive parallel computing"],"affiliations":[{"raw_affiliation_string":"Regularity and massive parallel computing","institution_ids":[]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.838356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":73,"max":75},"biblio":{"volume":null,"issue":null,"first_page":"783","last_page":"792"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9974,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/linear-algebra","display_name":"Linear algebra","score":0.7664507},{"id":"https://openalex.org/keywords/workstation","display_name":"Workstation","score":0.6082462},{"id":"https://openalex.org/keywords/numerical-linear-algebra","display_name":"Numerical Linear Algebra","score":0.49308917},{"id":"https://openalex.org/keywords/symmetric-multiprocessor-system","display_name":"Symmetric multiprocessor system","score":0.4567988},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.42803913}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.767833},{"id":"https://openalex.org/C139352143","wikidata":"https://www.wikidata.org/wiki/Q82571","display_name":"Linear algebra","level":2,"score":0.7664507},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7303571},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7215271},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.6648674},{"id":"https://openalex.org/C67953723","wikidata":"https://www.wikidata.org/wiki/Q192525","display_name":"Workstation","level":2,"score":0.6082462},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.6073521},{"id":"https://openalex.org/C158207573","wikidata":"https://www.wikidata.org/wiki/Q5747224","display_name":"Heterogeneous network","level":4,"score":0.5956882},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.59158915},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5789788},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5747085},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.56711996},{"id":"https://openalex.org/C163834973","wikidata":"https://www.wikidata.org/wiki/Q2004891","display_name":"Numerical linear algebra","level":3,"score":0.49308917},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4886108},{"id":"https://openalex.org/C172430144","wikidata":"https://www.wikidata.org/wiki/Q17111997","display_name":"Symmetric multiprocessor system","level":2,"score":0.4567988},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4486716},{"id":"https://openalex.org/C138959212","wikidata":"https://www.wikidata.org/wiki/Q1806783","display_name":"Load balancing (electrical power)","level":3,"score":0.4324332},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.42803913},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.2792797},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26415533},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13939407},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.07409608},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2000.846065","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://hal.inria.fr/hal-00856649","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://inria.hal.science/hal-00856649","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":14,"referenced_works":["https://openalex.org/W1564226586","https://openalex.org/W2010357511","https://openalex.org/W2012309011","https://openalex.org/W2030167104","https://openalex.org/W2050487400","https://openalex.org/W2082292996","https://openalex.org/W2087314423","https://openalex.org/W2093608182","https://openalex.org/W2117293168","https://openalex.org/W2154750565","https://openalex.org/W2925006810","https://openalex.org/W3007818428","https://openalex.org/W4239025233","https://openalex.org/W4289883074"],"related_works":["https://openalex.org/W4225552076","https://openalex.org/W4205760564","https://openalex.org/W3163773192","https://openalex.org/W2995201243","https://openalex.org/W278443433","https://openalex.org/W2522245970","https://openalex.org/W2500257945","https://openalex.org/W2061048205","https://openalex.org/W2021525945","https://openalex.org/W2007578977"],"abstract_inverted_index":{"We":[0,62],"study":[1,65],"the":[2,29,49,56,59,73,81,84],"implementation":[3],"of":[4,21,46,58,83,88,100],"dense":[5],"linear":[6,14],"algebra":[7],"computations,":[8],"such":[9],"as":[10],"matrix":[11],"multiplication":[12],"and":[13,33,64],"system":[15],"solvers,":[16],"on":[17,52,75],"two-dimensional":[18],"(2D)":[19],"grids":[20,54],"heterogeneous":[22,53,76,98],"processors.":[23,85],"For":[24],"these":[25,89],"operations,":[26],"2D-grids":[27,77],"are":[28],"key":[30],"to":[31,55,80],"scalability":[32],"efficiency.":[34],"The":[35,86],"uniform":[36],"block-cyclic":[37],"data":[38,68],"distribution":[39],"scheme":[40],"commonly":[41],"used":[42],"for":[43,96],"homogeneous":[44],"collections":[45],"processors":[47],"limits":[48],"performance-of-these":[50],"operations":[51],"speed":[57],"slowest":[60],"processor.":[61],"present":[63],"more":[66],"sophisticated":[67],"allocation":[69],"strategies":[70,90],"that":[71],"balance":[72],"load":[74],"with":[78],"respect":[79],"performance":[82],"usefulness":[87],"is":[91],"demonstrated":[92],"by":[93],"simulation":[94],"measurements":[95],"a":[97],"network":[99],"workstations.":[101]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1895923153","counts_by_year":[],"updated_date":"2024-12-07T18:32:20.419413","created_date":"2016-06-24"}