{"id":"https://openalex.org/W2095909712","doi":"https://doi.org/10.1177/1094342014526907","title":"Analyzing power efficiency of optimization techniques and algorithm design methods for applications on heterogeneous platforms","display_name":"Analyzing power efficiency of optimization techniques and algorithm design methods for applications on heterogeneous platforms","publication_year":2014,"publication_date":"2014-03-21","ids":{"openalex":"https://openalex.org/W2095909712","doi":"https://doi.org/10.1177/1094342014526907","mag":"2095909712"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342014526907","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019687323","display_name":"Yash Ukidave","orcid":null},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yash Ukidave","raw_affiliation_strings":["[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]"],"affiliations":[{"raw_affiliation_string":"[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021996030","display_name":"Amir Kavyan Ziabari","orcid":"https://orcid.org/0000-0002-5963-2374"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amir Kavyan Ziabari","raw_affiliation_strings":["[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]"],"affiliations":[{"raw_affiliation_string":"[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038365055","display_name":"Perhaad Mistry","orcid":null},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Perhaad Mistry","raw_affiliation_strings":["[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]"],"affiliations":[{"raw_affiliation_string":"[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026700236","display_name":"Gunar Schirner","orcid":"https://orcid.org/0000-0002-5408-8496"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gunar Schirner","raw_affiliation_strings":["[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]"],"affiliations":[{"raw_affiliation_string":"[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061128237","display_name":"David Kaeli","orcid":"https://orcid.org/0000-0002-5692-0151"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Kaeli","raw_affiliation_strings":["[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]"],"affiliations":[{"raw_affiliation_string":"[Department of Electrical and computer Engineering, Northeastern University, Boston, MA, USA]","institution_ids":["https://openalex.org/I12912129"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.391,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":8,"citation_normalized_percentile":{"value":0.799494,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":84,"max":85},"biblio":{"volume":"28","issue":"3","first_page":"319","last_page":"334"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.998,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/loop-unrolling","display_name":"Loop unrolling","score":0.73790437},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.50921905},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.46698993}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8367196},{"id":"https://openalex.org/C76970557","wikidata":"https://www.wikidata.org/wiki/Q1869750","display_name":"Loop unrolling","level":3,"score":0.73790437},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6198403},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5328738},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.52909374},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.50921905},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5018127},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.46698993},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.44892356},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3482734},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.114599854},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.11201736},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342014526907","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.91,"id":"https://metadata.un.org/sdg/7"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":36,"referenced_works":["https://openalex.org/W1597508330","https://openalex.org/W1717365219","https://openalex.org/W1903794615","https://openalex.org/W1976534780","https://openalex.org/W1978969737","https://openalex.org/W1979527452","https://openalex.org/W1992851788","https://openalex.org/W2000335122","https://openalex.org/W2002555321","https://openalex.org/W2024874287","https://openalex.org/W2047532956","https://openalex.org/W2066804546","https://openalex.org/W2102182691","https://openalex.org/W2103742924","https://openalex.org/W2108600626","https://openalex.org/W2114927422","https://openalex.org/W2123119012","https://openalex.org/W2123591640","https://openalex.org/W2129136709","https://openalex.org/W2144293278","https://openalex.org/W2146742876","https://openalex.org/W2147193503","https://openalex.org/W2149234156","https://openalex.org/W2149921618","https://openalex.org/W2160245390","https://openalex.org/W2160786443","https://openalex.org/W2161775046","https://openalex.org/W2167334577","https://openalex.org/W2213609752","https://openalex.org/W2295862081","https://openalex.org/W2620440553","https://openalex.org/W2997701623","https://openalex.org/W3145767355","https://openalex.org/W3147878143","https://openalex.org/W4250981202","https://openalex.org/W641086946"],"related_works":["https://openalex.org/W4300144375","https://openalex.org/W4250047567","https://openalex.org/W3214851784","https://openalex.org/W3028831948","https://openalex.org/W2982613029","https://openalex.org/W2344775847","https://openalex.org/W2292897598","https://openalex.org/W2153645222","https://openalex.org/W2128120785","https://openalex.org/W2100501042"],"abstract_inverted_index":{"Graphics":[0],"processing":[1],"units":[2],"(GPUs)":[3],"have":[4,52],"become":[5],"widely":[6],"accepted":[7],"as":[8,26,42,163],"the":[9,32,60,79,90,102,110,114,150,169,245,255,259,269,281],"computing":[10,18],"platform":[11],"of":[12,22,63,93,109,116,184,206,248,258],"choice":[13],"in":[14,56,191,198,204,215,232],"many":[15],"high":[16],"performance":[17,115,247],"domains.":[19],"The":[20,166],"availability":[21],"programming":[23],"standards":[24],"such":[25,41],"OpenCL":[27],"are":[28,74],"used":[29,96],"to":[30,49,76,211,219],"leverage":[31],"inherent":[33],"parallelism":[34],"offered":[35],"by":[36,105,194],"GPUs.":[37],"Source":[38],"code":[39],"optimizations":[40,95,186,242],"loop":[43],"unrolling":[44],"and":[45,136,142,149,159,171,284],"tiling":[46],"when":[47],"targeted":[48],"heterogeneous":[50,83,98,250],"applications":[51],"reported":[53],"large":[54],"gains":[55],"performance.":[57,207],"However,":[58],"given":[59],"power":[61,69,138,178,192,216,256],"consumption":[62,108,193,217,234],"GPUs,":[64,131],"platforms":[65],"can":[66,175,243,274],"exhaust":[67],"their":[68],"budgets":[70],"quickly.":[71],"Better":[72],"solutions":[73],"needed":[75],"effectively":[77],"exploit":[78],"power-efficiency":[80],"available":[81],"on":[82,97,120,280],"systems.":[84],"In":[85],"this":[86],"work,":[87],"we":[88,263],"evaluate":[89],"power/performance":[91,103],"efficiency":[92,257],"different":[94,117,122,236,241,266],"applications.":[99],"We":[100,112,180,208,226,238],"analyze":[101],"trade-off":[104],"evaluating":[106],"energy":[107,233],"optimizations.":[111,237],"compare":[113],"optimization":[118],"techniques":[119],"four":[121],"fast":[123],"Fourier":[124],"transform":[125],"implementations.":[126,225],"Our":[127],"study":[128,167],"covers":[129],"discrete":[130],"shared":[132],"memory":[133],"GPUs":[134],"(APUs)":[135],"low":[137],"system-on-chip":[139],"(SoC)":[140],"devices,":[141],"includes":[143],"hardware":[144,283],"from":[145],"AMD":[146],"(Llano":[147],"APUs":[148],"Southern":[151],"Islands":[152],"GPU),":[153],"Nvidia":[154],"(Kepler),":[155],"Intel":[156],"(Ivy":[157],"Bridge)":[158],"Qualcomm":[160],"(Snapdragon":[161],"S4)":[162],"test":[164],"platforms.":[165],"identifies":[168],"architectural":[170],"algorithmic":[172],"factors":[173],"which":[174,187],"most":[176],"impact":[177,254],"consumption.":[179],"explore":[181],"a":[182,249],"range":[183],"application":[185,286],"show":[188],"an":[189,212,229],"increase":[190,203],"27%,":[195],"but":[196,252],"result":[197],"more":[199],"than":[200],"1.8":[201],"\u00d7":[202],"speed":[205],"observe":[209,228],"up":[210],"18%":[213],"reduction":[214],"due":[218],"reduced":[220],"kernel":[221],"calls":[222],"across":[223],"FFT":[224],"also":[227,253],"11%":[230],"variation":[231],"among":[235],"highlight":[239],"how":[240],"improve":[244],"execution":[246],"application,":[251],"application.":[260],"More":[261],"importantly,":[262],"demonstrate":[264],"that":[265],"algorithms":[267],"implementing":[268],"same":[270],"fundamental":[271],"function":[272],"(FFT)":[273],"perform":[275],"with":[276],"vast":[277],"differences":[278],"based":[279],"target":[282],"associated":[285],"design.":[287]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2095909712","counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2025-01-18T15:05:25.610752","created_date":"2016-06-24"}