{"id":"https://openalex.org/W2013156670","doi":"https://doi.org/10.1109/pact.2011.68","title":"An Evaluation of Vectorizing Compilers","display_name":"An Evaluation of Vectorizing Compilers","publication_year":2011,"publication_date":"2011-10-01","ids":{"openalex":"https://openalex.org/W2013156670","doi":"https://doi.org/10.1109/pact.2011.68","mag":"2013156670"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2011.68","pdf_url":null,"source":{"id":"https://openalex.org/S4306419751","display_name":"International Conference on Parallel Architectures and Compilation Techniques","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":"http://polaris.cs.uiuc.edu/%7Egarzaran/doc/pact11.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077514991","display_name":"Saeed Maleki","orcid":"https://orcid.org/0000-0003-1107-1827"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Saeed Maleki","raw_affiliation_strings":["[Dept. of Computer Science, University of Illinois at Urbana-Champaign, Urbana, IL, USA]"],"affiliations":[{"raw_affiliation_string":"[Dept. of Computer Science, University of Illinois at Urbana-Champaign, Urbana, IL, USA]","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101439379","display_name":"Yaoqing Gao","orcid":"https://orcid.org/0000-0002-5392-5088"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yaoqing Gao","raw_affiliation_strings":["IBM Toronto Lab., Markham, ON, Canada"],"affiliations":[{"raw_affiliation_string":"IBM Toronto Lab., Markham, ON, Canada","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110864141","display_name":"Mar\u00eda Jes\u00fas Garzar\u00e1n","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mar\u00eda J. Garzar\u00e1n","raw_affiliation_strings":["[Dept. of Computer Science, University of Illinois at Urbana-Champaign, Urbana, IL, USA]"],"affiliations":[{"raw_affiliation_string":"[Dept. of Computer Science, University of Illinois at Urbana-Champaign, Urbana, IL, USA]","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018991067","display_name":"Tommy Wong","orcid":"https://orcid.org/0000-0002-0551-9827"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tommy Wong","raw_affiliation_strings":["IBM Toronto Lab., Markham, ON, Canada"],"affiliations":[{"raw_affiliation_string":"IBM Toronto Lab., Markham, ON, Canada","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109071293","display_name":"David Padua","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David A. Padua","raw_affiliation_strings":["[Dept. of Computer Science, University of Illinois at Urbana-Champaign, Urbana, IL, USA]"],"affiliations":[{"raw_affiliation_string":"[Dept. of Computer Science, University of Illinois at Urbana-Champaign, Urbana, IL, USA]","institution_ids":["https://openalex.org/I157725225"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.435,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":193,"citation_normalized_percentile":{"value":0.967193,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"372","last_page":"382"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9979,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.8264381},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7903687},{"id":"https://openalex.org/keywords/petascale-computing","display_name":"Petascale computing","score":0.77612025},{"id":"https://openalex.org/keywords/intrinsics","display_name":"Intrinsics","score":0.7302012},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6683488},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.41821653}],"concepts":[{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.9228274},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8866482},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.8264381},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7903687},{"id":"https://openalex.org/C185410017","wikidata":"https://www.wikidata.org/wiki/Q7171778","display_name":"Petascale computing","level":3,"score":0.77612025},{"id":"https://openalex.org/C2908650547","wikidata":"https://www.wikidata.org/wiki/Q20999234","display_name":"Intrinsics","level":2,"score":0.7302012},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.69524693},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6683488},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.56899285},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.41821653},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4122383},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.23647231},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2011.68","pdf_url":null,"source":{"id":"https://openalex.org/S4306419751","display_name":"International Conference on Parallel Architectures and Compilation Techniques","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.221.2118","pdf_url":"http://polaris.cs.uiuc.edu/%7Egarzaran/doc/pact11.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.221.2118","pdf_url":"http://polaris.cs.uiuc.edu/%7Egarzaran/doc/pact11.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.66}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":20,"referenced_works":["https://openalex.org/W1560149279","https://openalex.org/W1595548352","https://openalex.org/W1967810725","https://openalex.org/W1985410827","https://openalex.org/W1999172993","https://openalex.org/W2015284894","https://openalex.org/W2034186738","https://openalex.org/W2092492242","https://openalex.org/W2099404643","https://openalex.org/W2108283760","https://openalex.org/W2114279700","https://openalex.org/W2143964612","https://openalex.org/W2144433126","https://openalex.org/W2167639788","https://openalex.org/W2264086856","https://openalex.org/W2323216115","https://openalex.org/W2543027172","https://openalex.org/W3140574618","https://openalex.org/W4245302940","https://openalex.org/W4248327003"],"related_works":["https://openalex.org/W4313423325","https://openalex.org/W4234143480","https://openalex.org/W4213329980","https://openalex.org/W2979513934","https://openalex.org/W2778498407","https://openalex.org/W2623389408","https://openalex.org/W2351155539","https://openalex.org/W2013156670","https://openalex.org/W1970451660","https://openalex.org/W1939907483"],"abstract_inverted_index":{"Most":[0],"of":[1,50,67,116],"today's":[2],"processors":[3],"include":[4],"vector":[5,17,24],"units":[6],"that":[7,102],"have":[8],"been":[9],"designed":[10],"to":[11,46],"speedup":[12],"single":[13],"threaded":[14],"programs.":[15],"Although":[16],"instructions":[18],"can":[19],"deliver":[20],"high":[21,33],"performance,":[22],"writing":[23],"code":[25],"in":[26,32,108,110,119],"assembly":[27],"language":[28],"or":[29],"using":[30,53],"intrinsics":[31],"level":[34],"languages":[35],"is":[36,45],"a":[37,63,125],"time":[38],"consuming":[39],"and":[40,78,95,123],"error-prone":[41],"task.":[42],"The":[43],"alternative":[44],"automate":[47],"the":[48,105,111,117,120,129,135],"process":[49],"vectorization":[51,109],"by":[52,134],"vectorizing":[54],"compilers.":[55],"This":[56],"paper":[57],"evaluates":[58],"how":[59],"well":[60],"compilers":[61,136],"vectorize":[62],"synthetic":[64,121],"benchmark":[65,122],"consisting":[66],"151":[68],"loops,":[69],"two":[70],"application":[71],"from":[72,81,128],"Petascale":[73],"Application":[74],"Collaboration":[75],"Teams":[76],"(PACT),":[77],"eight":[79],"applications":[80,131],"Media":[82],"Bench":[83],"II.":[84],"We":[85],"evaluated":[86],"three":[87],"compilers:":[88],"GCC":[89],"(version":[90,93,97],"4.7.0),":[91],"ICC":[92],"12.0)":[94],"XLC":[96],"11.01).":[98],"Our":[99],"results":[100],"show":[101],"despite":[103],"all":[104],"work":[106],"done":[107],"last":[112],"40":[113],"years":[114],"45-71%":[115],"loops":[118,127],"only":[124],"few":[126],"real":[130],"are":[132],"vectorized":[133],"we":[137],"evaluated.":[138]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2013156670","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":15},{"year":2019,"cited_by_count":19},{"year":2018,"cited_by_count":23},{"year":2017,"cited_by_count":20},{"year":2016,"cited_by_count":27},{"year":2015,"cited_by_count":26},{"year":2014,"cited_by_count":14},{"year":2013,"cited_by_count":17},{"year":2012,"cited_by_count":6}],"updated_date":"2024-12-31T11:57:21.794672","created_date":"2016-06-24"}