{"id":"https://openalex.org/W2085582906","doi":"https://doi.org/10.1109/pact.2011.48","title":"A Compiler-assisted Runtime-prefetching Scheme for Heterogenous Platforms","display_name":"A Compiler-assisted Runtime-prefetching Scheme for Heterogenous Platforms","publication_year":2011,"publication_date":"2011-10-01","ids":{"openalex":"https://openalex.org/W2085582906","doi":"https://doi.org/10.1109/pact.2011.48","mag":"2085582906"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2011.48","pdf_url":null,"source":{"id":"https://openalex.org/S4306419751","display_name":"International Conference on Parallel Architectures and Compilation Techniques","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022872434","display_name":"Baojiang Shou","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baojiang Shou","raw_affiliation_strings":["ict, Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"ict, Beijing, China#TAB#","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048532222","display_name":"Xionghui Hou","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xionghui Hou","raw_affiliation_strings":["ict, Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"ict, Beijing, China#TAB#","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100379221","display_name":"Li Chen","orcid":"https://orcid.org/0000-0002-2300-6996"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Chen","raw_affiliation_strings":["ict, Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"ict, Beijing, China#TAB#","institution_ids":["https://openalex.org/I19820366"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":65},"biblio":{"volume":null,"issue":null,"first_page":"215","last_page":"215"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8621764},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.7896577},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.75425196},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.69785064},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.5075909},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.4336362},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.42314655},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4164763},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3590193},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.33266413},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.15958607},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2011.48","pdf_url":null,"source":{"id":"https://openalex.org/S4306419751","display_name":"International Conference on Parallel Architectures and Compilation Techniques","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":24,"referenced_works":["https://openalex.org/W1480281982","https://openalex.org/W1537323515","https://openalex.org/W1805440014","https://openalex.org/W1987588924","https://openalex.org/W2007000019","https://openalex.org/W2015935981","https://openalex.org/W2016352575","https://openalex.org/W2032039029","https://openalex.org/W2087085699","https://openalex.org/W2105528986","https://openalex.org/W2109426995","https://openalex.org/W2111354435","https://openalex.org/W2121893797","https://openalex.org/W2129232868","https://openalex.org/W2135518093","https://openalex.org/W2139935536","https://openalex.org/W2142421493","https://openalex.org/W2150476673","https://openalex.org/W2153808006","https://openalex.org/W2159481344","https://openalex.org/W2160875256","https://openalex.org/W2167101788","https://openalex.org/W2399715892","https://openalex.org/W518915"],"related_works":["https://openalex.org/W4240253816","https://openalex.org/W4232954277","https://openalex.org/W3096456556","https://openalex.org/W2979513934","https://openalex.org/W2749133591","https://openalex.org/W2505380084","https://openalex.org/W2367473450","https://openalex.org/W2169584677","https://openalex.org/W2020341030","https://openalex.org/W1979099492"],"abstract_inverted_index":{"GPGPU":[0,33],"has":[1,134],"been":[2,136],"widely":[3,44],"adopted":[4],"by":[5,32,46,138],"industry":[6],"and":[7,20,64,71,77,106,141],"academia.":[8],"For":[9],"real":[10],"applications":[11],"on":[12,84],"industry,":[13],"however,":[14],"the":[15,26,35,78,93,120,131,150],"data":[16,67],"communications":[17,68],"between":[18,69],"CPUs":[19,70],"GPUs":[21],"often":[22],"dramatically":[23],"slow":[24],"down":[25],"overall":[27],"performance.":[28],"Another":[29],"difficulty":[30],"raised":[31],"is":[34,39,55,75,81,102],"programming":[36,42],"productivity.":[37],"OpenMP":[38],"a":[40,59,97,103,107],"high-level":[41],"model":[43],"accepted":[45],"industry.":[47],"A":[48],"software":[49],"distributed":[50],"shared":[51,61],"memory":[52,62],"system":[53,95],"(DSM)":[54],"implemented":[56],"to":[57,65,126],"provide":[58],"logic":[60],"space":[63],"manage":[66],"GPUs.":[72],"The":[73,115,145],"DSM":[74,94],"block-based,":[76],"block":[79],"size":[80],"adjustable":[82],"based":[83],"loop":[85],"partitioning":[86],"parameters.":[87],"In":[88],"this":[89],"work,":[90],"we":[91],"optimize":[92],"using":[96],"compiler-assisted":[98],"data-prefetching":[99],"scheme.":[100],"There":[101],"prefetching":[104,108,116,143,146,151],"thread":[105,117],"worker":[109,147],"for":[110],"each":[111],"sepa":[112],"rated":[113],"memory.":[114],"looks":[118],"into":[119],"future,":[121],"applies":[122],"inter-thread":[123],"use-def":[124],"analysis":[125],"judge":[127],"which":[128],"part":[129],"of":[130],"USE":[132],"region":[133],"already":[135],"generated":[137],"computing":[139],"threads":[140],"produces":[142],"requests.":[144],"carries":[148],"out":[149],"operations.":[152]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2085582906","counts_by_year":[],"updated_date":"2024-12-09T03:30:09.506701","created_date":"2016-06-24"}