{"id":"https://openalex.org/W2737762472","doi":"https://doi.org/10.1145/3079758","title":"Throughput-Optimized FPGA Accelerator for Deep Convolutional Neural Networks","display_name":"Throughput-Optimized FPGA Accelerator for Deep Convolutional Neural Networks","publication_year":2017,"publication_date":"2017-07-19","ids":{"openalex":"https://openalex.org/W2737762472","doi":"https://doi.org/10.1145/3079758","mag":"2737762472"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3079758","pdf_url":null,"source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100415093","display_name":"Zhi-Qiang Liu","orcid":"https://orcid.org/0000-0002-1883-2871"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqiang Liu","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051680867","display_name":"Yong Dou","orcid":"https://orcid.org/0000-0002-1256-8934"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Dou","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069310600","display_name":"Jingfei Jiang","orcid":"https://orcid.org/0000-0002-7103-8650"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingfei Jiang","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088703563","display_name":"Jinwei Xu","orcid":"https://orcid.org/0000-0003-1242-4217"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinwei Xu","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101782032","display_name":"Shijie Li","orcid":"https://orcid.org/0000-0002-0529-0057"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shijie Li","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115076610","display_name":"Yongmei Zhou","orcid":"https://orcid.org/0000-0003-2661-3078"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongmei Zhou","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052219010","display_name":"Yingnan Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingnan Xu","raw_affiliation_strings":["National University of Defense Technology, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, Hunan, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":7.146,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":96,"citation_normalized_percentile":{"value":0.999933,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"10","issue":"3","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.999,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reconfigurability","display_name":"Reconfigurability","score":0.7732565},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.6052822},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.5558428},{"id":"https://openalex.org/keywords/design-space-exploration","display_name":"Design space exploration","score":0.43838084},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.4217423}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8970436},{"id":"https://openalex.org/C2780149590","wikidata":"https://www.wikidata.org/wiki/Q7302742","display_name":"Reconfigurability","level":2,"score":0.7732565},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.68340707},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.6762281},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.625439},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.6052822},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5574802},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.5558428},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5177576},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4675229},{"id":"https://openalex.org/C2776221188","wikidata":"https://www.wikidata.org/wiki/Q21072556","display_name":"Design space exploration","level":2,"score":0.43838084},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.43183383},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.4217423},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.4166251},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4097039},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.35444003},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.34769738},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2374331},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12667617},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3079758","pdf_url":null,"source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.9}],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"U1435219, 61303070, 61402507 and 61402499"}],"datasets":[],"versions":[],"referenced_works_count":23,"referenced_works":["https://openalex.org/W1950136256","https://openalex.org/W1963882359","https://openalex.org/W1990315422","https://openalex.org/W1995562189","https://openalex.org/W2009832130","https://openalex.org/W2016053056","https://openalex.org/W2048266589","https://openalex.org/W2062118960","https://openalex.org/W2094756095","https://openalex.org/W2097117768","https://openalex.org/W2102605133","https://openalex.org/W2117130368","https://openalex.org/W2135252045","https://openalex.org/W2161591461","https://openalex.org/W2162931300","https://openalex.org/W2163605009","https://openalex.org/W2265846598","https://openalex.org/W2276486856","https://openalex.org/W2294282016","https://openalex.org/W2308045930","https://openalex.org/W2499811908","https://openalex.org/W2560674852","https://openalex.org/W2952899695"],"related_works":["https://openalex.org/W4386302689","https://openalex.org/W4293243607","https://openalex.org/W4285429137","https://openalex.org/W3195471267","https://openalex.org/W3193699965","https://openalex.org/W3133116121","https://openalex.org/W3032310658","https://openalex.org/W2971009090","https://openalex.org/W2625058759","https://openalex.org/W2068996722"],"abstract_inverted_index":{"Deep":[0],"convolutional":[1],"neural":[2],"networks":[3],"(CNNs)":[4],"have":[5,86],"gained":[6],"great":[7],"success":[8],"in":[9,52,126],"various":[10],"computer":[11],"vision":[12],"applications.":[13],"State-of-the-art":[14],"CNN":[15,91,110],"models":[16],"for":[17,141],"large-scale":[18,53],"applications":[19],"are":[20,28],"computation":[21,66,102],"intensive":[22],"and":[23,37,80,104,162,177,194,204],"memory":[24,106,160],"expensive":[25],"and,":[26],"hence,":[27],"mainly":[29],"processed":[30],"on":[31,179],"high-performance":[32],"processors":[33],"like":[34],"server":[35],"CPUs":[36],"GPUs.":[38],"However,":[39],"there":[40],"is":[41,118,191],"an":[42,98],"increasing":[43],"demand":[44],"of":[45,63,77,101,108,124,187],"high-accuracy":[46],"or":[47,55,68],"real-time":[48],"object":[49],"detection":[50],"tasks":[51],"clusters":[54],"embedded":[56],"systems,":[57],"which":[58,200],"requires":[59],"energy-efficient":[60],"accelerators":[61,190],"because":[62],"the":[64,69,75,105,142,150,168,188,202],"green":[65],"requirement":[67],"limited":[70],"battery":[71],"restriction.":[72],"Due":[73],"to":[74,139],"advantages":[76],"energy":[78],"efficiency":[79],"reconfigurability,":[81],"Field-Programmable":[82],"Gate":[83],"Arrays":[84],"(FPGAs)":[85],"been":[87],"widely":[88],"explored":[89],"as":[90,154],"accelerators.":[92],"In":[93],"this":[94],"article,":[95],"we":[96,166],"present":[97],"in-depth":[99],"analysis":[100],"complexity":[103],"footprint":[107],"each":[109],"layer":[111],"type.":[112],"Then":[113],"a":[114,133,180],"scalable":[115],"parallel":[116],"framework":[117],"proposed":[119],"that":[120,145],"exploits":[121],"four":[122],"levels":[123],"parallelism":[125],"hardware":[127],"acceleration.":[128],"We":[129],"further":[130],"put":[131],"forward":[132],"systematic":[134],"design":[135],"space":[136],"exploration":[137],"methodology":[138,169],"search":[140],"optimal":[143],"solution":[144],"maximizes":[146],"accelerator":[147],"throughput":[148],"under":[149,196],"FPGA":[151],"constraints":[152],"such":[153],"on-chip":[155],"memory,":[156],"computational":[157],"resources,":[158],"external":[159],"bandwidth,":[161],"clock":[163],"frequency.":[164],"Finally,":[165],"demonstrate":[167],"by":[170],"optimizing":[171],"three":[172,189],"representative":[173],"CNNs":[174],"(LeNet,":[175],"AlexNet,":[176],"VGG-S)":[178],"Xilinx":[181],"VC709":[182],"board.":[183],"The":[184],"average":[185],"performance":[186],"424.7,":[192],"445.6,":[193],"473.4GOP/s":[195],"100MHz":[197],"working":[198],"frequency,":[199],"outperforms":[201],"CPU":[203],"previous":[205],"work":[206],"significantly.":[207]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2737762472","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":11},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":24},{"year":2019,"cited_by_count":14},{"year":2018,"cited_by_count":19},{"year":2017,"cited_by_count":2}],"updated_date":"2024-12-18T02:48:11.280343","created_date":"2017-07-31"}