{"id":"https://openalex.org/W4386707690","doi":"https://doi.org/10.1145/3605573.3605600","title":"Performance-Aware Energy-Efficient GPU Frequency Selection using DNN-based Models","display_name":"Performance-Aware Energy-Efficient GPU Frequency Selection using DNN-based Models","publication_year":2023,"publication_date":"2023-08-07","ids":{"openalex":"https://openalex.org/W4386707690","doi":"https://doi.org/10.1145/3605573.3605600"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3605573.3605600","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3605573.3605600","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3605573.3605600","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035049481","display_name":"Ghazanfar Ali","orcid":"https://orcid.org/0000-0001-5158-8236"},"institutions":[{"id":"https://openalex.org/I12315562","display_name":"Texas Tech University","ror":"https://ror.org/0405mnx93","country_code":"US","type":"education","lineage":["https://openalex.org/I12315562"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ghazanfar Ali","raw_affiliation_strings":["Computer Science, Texas Tech University, United States of America"],"affiliations":[{"raw_affiliation_string":"Computer Science, Texas Tech University, United States of America","institution_ids":["https://openalex.org/I12315562"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078558721","display_name":"Mert Side","orcid":"https://orcid.org/0000-0002-0815-4763"},"institutions":[{"id":"https://openalex.org/I12315562","display_name":"Texas Tech University","ror":"https://ror.org/0405mnx93","country_code":"US","type":"education","lineage":["https://openalex.org/I12315562"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mert Side","raw_affiliation_strings":["Computer Science, Texas Tech University, United States of America"],"affiliations":[{"raw_affiliation_string":"Computer Science, Texas Tech University, United States of America","institution_ids":["https://openalex.org/I12315562"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057716533","display_name":"Sridutt Bhalachandra","orcid":"https://orcid.org/0000-0003-1084-5683"},"institutions":[{"id":"https://openalex.org/I4210151627","display_name":"National Energy Research Scientific Computing Center","ror":"https://ror.org/05v3mvq14","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521","https://openalex.org/I4210151627"]},{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sridutt Bhalachandra","raw_affiliation_strings":["National Energy Research Scientific Computing Center (NERSC), Lawrence Berkeley National Laboratory, United States of America"],"affiliations":[{"raw_affiliation_string":"National Energy Research Scientific Computing Center (NERSC), Lawrence Berkeley National Laboratory, United States of America","institution_ids":["https://openalex.org/I4210151627","https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070066590","display_name":"Nicholas J. Wright","orcid":"https://orcid.org/0000-0003-1883-6108"},"institutions":[{"id":"https://openalex.org/I4210151627","display_name":"National Energy Research Scientific Computing Center","ror":"https://ror.org/05v3mvq14","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521","https://openalex.org/I4210151627"]},{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicholas J. Wright","raw_affiliation_strings":["National Energy Research Scientific Computing Center (NERSC), Lawrence Berkeley National Laboratory, United States of America"],"affiliations":[{"raw_affiliation_string":"National Energy Research Scientific Computing Center (NERSC), Lawrence Berkeley National Laboratory, United States of America","institution_ids":["https://openalex.org/I4210151627","https://openalex.org/I148283060"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077521546","display_name":"Yong Chen","orcid":"https://orcid.org/0000-0002-9961-9051"},"institutions":[{"id":"https://openalex.org/I12315562","display_name":"Texas Tech University","ror":"https://ror.org/0405mnx93","country_code":"US","type":"education","lineage":["https://openalex.org/I12315562"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yong Chen","raw_affiliation_strings":["Computer Science, Texas Tech University, United States of America"],"affiliations":[{"raw_affiliation_string":"Computer Science, Texas Tech University, United States of America","institution_ids":["https://openalex.org/I12315562"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.394,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":6,"citation_normalized_percentile":{"value":0.999475,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":92,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"433","last_page":"442"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9971,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.7154609},{"id":"https://openalex.org/keywords/design-space-exploration","display_name":"Design space exploration","score":0.605822},{"id":"https://openalex.org/keywords/spec#","display_name":"Spec#","score":0.48138312},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.46740204}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.84652567},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.7154609},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.6623626},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.6161487},{"id":"https://openalex.org/C2776221188","wikidata":"https://www.wikidata.org/wiki/Q21072556","display_name":"Design space exploration","level":2,"score":0.605822},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5179614},{"id":"https://openalex.org/C2778565505","wikidata":"https://www.wikidata.org/wiki/Q2207566","display_name":"Spec#","level":2,"score":0.48138312},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.46740204},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.44674644},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.44184422},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.44151357},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.43568206},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.43053287},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.41660148},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.41217867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32950675},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.28943172},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.15102571},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08818245},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3605573.3605600","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3605573.3605600","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3605573.3605600","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3605573.3605600","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.8,"id":"https://metadata.un.org/sdg/7"}],"grants":[{"funder":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation","award_id":"CNS-1817094, OAC-1835892, CNS-1939140"},{"funder":"https://openalex.org/F4320317220","funder_display_name":"National Energy Research Scientific Computing Center","award_id":"DEAC02-05CH11231"}],"datasets":[],"versions":[],"referenced_works_count":24,"referenced_works":["https://openalex.org/W1966078827","https://openalex.org/W2002016471","https://openalex.org/W2038666141","https://openalex.org/W2074084090","https://openalex.org/W2082290707","https://openalex.org/W2154189213","https://openalex.org/W2155470578","https://openalex.org/W2495572165","https://openalex.org/W2499556698","https://openalex.org/W2751343396","https://openalex.org/W2787719654","https://openalex.org/W2808522216","https://openalex.org/W2945969444","https://openalex.org/W2962843187","https://openalex.org/W2984189761","https://openalex.org/W2997591727","https://openalex.org/W3010946599","https://openalex.org/W3037110041","https://openalex.org/W3046751266","https://openalex.org/W3134495297","https://openalex.org/W3201073812","https://openalex.org/W4253793222","https://openalex.org/W4287902686","https://openalex.org/W4308090478"],"related_works":["https://openalex.org/W4365793791","https://openalex.org/W4288420200","https://openalex.org/W4282568311","https://openalex.org/W3145095675","https://openalex.org/W3134072570","https://openalex.org/W2951473296","https://openalex.org/W2883928845","https://openalex.org/W2168940796","https://openalex.org/W2024329643","https://openalex.org/W2016659453"],"abstract_inverted_index":{"Energy":[0],"efficiency":[1],"will":[2],"be":[3],"important":[4],"in":[5],"future":[6],"accelerator-based":[7],"HPC":[8],"systems":[9],"for":[10,27,52,59],"sustainability":[11],"and":[12,30,47,65,82,85,105],"to":[13],"improve":[14],"overall":[15],"performance.":[16],"This":[17],"study":[18],"proposes":[19],"a":[20,60,116],"deep":[21],"neural":[22],"network":[23],"(DNN)-based":[24],"learning":[25],"model":[26,53,140],"execution":[28],"time":[29,86],"power":[31,84,104],"consumption":[32],"of":[33,113,119,130],"workloads":[34],"across":[35,142],"GPUs":[36],"DVFS":[37],"design":[38],"space.":[39],"Micro-architectural":[40],"data":[41,70],"obtained":[42],"by":[43,63],"running":[44],"SPEC-ACCEL,":[45],"DGEMM,":[46],"STREAM":[48],"benchmarks":[49],"are":[50,57],"used":[51],"training.":[54],"These":[55],"features":[56],"consistent":[58],"workload":[61],"unaffected":[62],"frequency":[64],"input":[66],"size":[67],"reducing":[68],"the":[69],"required":[71],"significantly.":[72],"For":[73],"real-world":[74],"applications":[75],"-":[76],"LAMMPS,":[77],"NAMD,":[78],"GROMACS,":[79],"LSTM,":[80],"BERT,":[81],"ResNet50":[83],"models":[87,123],"show":[88],"89%":[89],"\u2013":[90],"98%":[91],"accuracy":[92,129],"on":[93,125,134],"NVIDIA":[94,136],"Ampere.":[95],"Multi-objective":[96],"functions":[97],"help":[98],"select":[99],"optimal":[100],"frequencies":[101],"that":[102],"lower":[103],"minimize":[106],"performance":[107,117],"impact":[108],"showing":[109],"maximum":[110],"energy":[111],"savings":[112],"27%":[114],"at":[115],"loss":[118],"1.8%.":[120],"The":[121],"same":[122],"trained":[124],"Ampere":[126],"showed":[127],"an":[128,135],"greater":[131],"than":[132],"93%":[133],"Volta,":[137],"thereby":[138],"demonstrating":[139],"portability":[141],"architectures.":[143]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4386707690","counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1}],"updated_date":"2024-12-12T08:57:13.419881","created_date":"2023-09-14"}