{"id":"https://openalex.org/W2120371291","doi":"https://doi.org/10.1109/hipc.2013.6799102","title":"Speculative dynamic vectorization to assist static vectorization in a HW/SW co-designed environment","display_name":"Speculative dynamic vectorization to assist static vectorization in a HW/SW co-designed environment","publication_year":2013,"publication_date":"2013-12-01","ids":{"openalex":"https://openalex.org/W2120371291","doi":"https://doi.org/10.1109/hipc.2013.6799102","mag":"2120371291"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/hipc.2013.6799102","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.pure.ed.ac.uk/ws/files/24271857/HiPC2013.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017675158","display_name":"Rakesh Kumar","orcid":"https://orcid.org/0000-0001-6306-304X"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Rakesh Kumar","raw_affiliation_strings":["Dept. of Comput. Archit., Univ. Politec. de Catalunya, Barcelona, Spain"],"affiliations":[{"raw_affiliation_string":"Dept. of Comput. Archit., Univ. Politec. de Catalunya, Barcelona, Spain","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100731047","display_name":"A. Mart\u00ednez","orcid":"https://orcid.org/0000-0001-8292-0377"},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alejandro Martinez","raw_affiliation_strings":["Intel Labs., Intel Barcelona Res. Center, Barcelona, Spain"],"affiliations":[{"raw_affiliation_string":"Intel Labs., Intel Barcelona Res. Center, Barcelona, Spain","institution_ids":["https://openalex.org/I1343180700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100733331","display_name":"Antonio Gonz\u00e1lez","orcid":"https://orcid.org/0000-0002-0009-0996"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Antonio Gonzalez","raw_affiliation_strings":["Dept. of Comput. Archit., Univ. Politec. de Catalunya, Barcelona, Spain"],"affiliations":[{"raw_affiliation_string":"Dept. of Comput. Archit., Univ. Politec. de Catalunya, Barcelona, Spain","institution_ids":["https://openalex.org/I9617848"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.947,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":8,"citation_normalized_percentile":{"value":0.546685,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":83,"max":84},"biblio":{"volume":null,"issue":null,"first_page":"79","last_page":"88"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9968,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.94500077},{"id":"https://openalex.org/keywords/dependence-analysis","display_name":"Dependence analysis","score":0.4687562},{"id":"https://openalex.org/keywords/compile-time","display_name":"Compile time","score":0.43511376}],"concepts":[{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.94500077},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.83584017},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.74744874},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7203637},{"id":"https://openalex.org/C150202949","wikidata":"https://www.wikidata.org/wiki/Q107602","display_name":"Pointer (user interface)","level":2,"score":0.5749775},{"id":"https://openalex.org/C27390822","wikidata":"https://www.wikidata.org/wiki/Q320724","display_name":"Dependence analysis","level":2,"score":0.4687562},{"id":"https://openalex.org/C200833197","wikidata":"https://www.wikidata.org/wiki/Q333707","display_name":"Compile time","level":3,"score":0.43511376},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2941829},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.18364307}],"mesh":[],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/hipc.2013.6799102","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.pure.ed.ac.uk/ws/files/24271857/HiPC2013.pdf","pdf_url":"https://www.pure.ed.ac.uk/ws/files/24271857/HiPC2013.pdf","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/portal/en/publications/speculative-dynamic-vectorization-to-assist-static-vectorization-in-a-hwsw-codesigned-environment(46253c7e-fc72-49a0-b7b2-c375d71969ee).html","pdf_url":"https://www.research.ed.ac.uk/files/24271857/HiPC2013.pdf","source":{"id":"https://openalex.org/S4306400320","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://www.pure.ed.ac.uk/ws/files/24271857/HiPC2013.pdf","pdf_url":"https://www.pure.ed.ac.uk/ws/files/24271857/HiPC2013.pdf","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false},"sustainable_development_goals":[{"score":0.64,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, justice, and strong institutions"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":22,"referenced_works":["https://openalex.org/W1495550651","https://openalex.org/W1542196645","https://openalex.org/W1563221445","https://openalex.org/W1966324811","https://openalex.org/W1984972320","https://openalex.org/W2005343162","https://openalex.org/W2013156670","https://openalex.org/W2054103475","https://openalex.org/W2059807497","https://openalex.org/W2092721177","https://openalex.org/W2100543364","https://openalex.org/W2111394443","https://openalex.org/W2122963045","https://openalex.org/W2127594310","https://openalex.org/W2143375055","https://openalex.org/W2143964612","https://openalex.org/W2148865465","https://openalex.org/W3145750999","https://openalex.org/W4237444170","https://openalex.org/W4247793638","https://openalex.org/W4251500183","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W3006505070","https://openalex.org/W2979513934","https://openalex.org/W2767298477","https://openalex.org/W2382449560","https://openalex.org/W2371266106","https://openalex.org/W2351155539","https://openalex.org/W2117864619","https://openalex.org/W2117382851","https://openalex.org/W2110432562","https://openalex.org/W2013156670"],"abstract_inverted_index":{"Compiler":[0],"based":[1,25],"static":[2,82,149],"vectorization":[3,17,37,69,83,99,109,122,140,150,156,162,175],"is":[4,18,158],"used":[5],"widely":[6],"to":[7,30,51,79,107,120,147],"extract":[8],"data":[9],"level":[10],"parallelism":[11],"from":[12],"computation":[13],"intensive":[14],"applications.":[15,26,43,179],"Static":[16],"very":[19],"effective":[20,160],"in":[21,40,67,89,127,161,177],"vectorizing":[22],"traditional":[23],"array":[24],"However,":[27],"compilers":[28,172],"inability":[29],"reorder":[31],"ambiguous":[32,104],"memory":[33,105,116],"references":[34,106],"severely":[35],"limits":[36],"opportunities,":[38],"especially":[39],"pointer":[41],"rich":[42],"HW/SW":[44,91],"co-designed":[45],"processors":[46],"provide":[47],"an":[48],"excellent":[49],"opportunity":[50],"optimize":[52],"the":[53,74,81,135,148,168],"applications":[54,165],"at":[55,63],"runtime.":[56],"The":[57,111],"availability":[58],"of":[59,129,163],"dynamic":[60,87,98,155],"application":[61],"behavior":[62],"runtime":[64],"will":[65],"help":[66],"capturing":[68],"opportunities":[70,176],"generally":[71],"missed":[72],"by":[73],"compilers.":[75],"This":[76],"paper":[77],"proposes":[78],"complement":[80],"with":[84],"a":[85,90,96],"speculative":[86,97,121],"vectorizer":[88],"co-design":[92],"processor.":[93],"We":[94],"present":[95],"algorithm":[100],"that":[101,134],"speculatively":[102],"reorders":[103],"uncover":[108],"opportunities.":[110],"hardware":[112],"checks":[113],"for":[114,152,167],"any":[115],"dependence":[117],"violation":[118],"due":[119],"and":[123],"takes":[124],"corrective":[125],"action":[126],"case":[128],"violation.":[130],"Our":[131],"experiments":[132],"show":[133],"combined":[136],"(static":[137],"+":[138],"dynamic)":[139],"approach":[141],"provides":[142],"2x":[143],"performance":[144],"benefit":[145],"compared":[146],"alone,":[151],"SPECFP2006.":[153],"Moreover,":[154],"scheme":[157],"as":[159,166],"pointer-based":[164,178],"array-based":[169],"ones,":[170],"whereas":[171],"lose":[173],"significant":[174]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2120371291","counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2014,"cited_by_count":4}],"updated_date":"2025-01-15T01:03:57.782293","created_date":"2016-06-24"}