{"id":"https://openalex.org/W1632742330","doi":"https://doi.org/10.1109/ijcnn.2015.7280511","title":"Optimized deep belief networks on CUDA GPUs","display_name":"Optimized deep belief networks on CUDA GPUs","publication_year":2015,"publication_date":"2015-07-01","ids":{"openalex":"https://openalex.org/W1632742330","doi":"https://doi.org/10.1109/ijcnn.2015.7280511","mag":"1632742330"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2015.7280511","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100416739","display_name":"Teng Li","orcid":"https://orcid.org/0000-0002-5621-7351"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"funder","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Teng Li","raw_affiliation_strings":["National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051680867","display_name":"Yong Dou","orcid":"https://orcid.org/0000-0002-1256-8934"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"funder","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Yong Dou","raw_affiliation_strings":["National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047572387","display_name":"Jingfei Jiang","orcid":"https://orcid.org/0000-0003-2668-3228"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"funder","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Jingfei Jiang","raw_affiliation_strings":["National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015493306","display_name":"Yueqing Wang","orcid":"https://orcid.org/0000-0002-8734-8346"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"funder","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Yueqing Wang","raw_affiliation_strings":["National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109884886","display_name":"Qi Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"funder","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Qi Lv","raw_affiliation_strings":["National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Parallel & Distributed Processing, National University of Defense and Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.303,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":12,"citation_normalized_percentile":{"value":0.735443,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":87,"max":88},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/deep-belief-network","display_name":"Deep belief network","score":0.860839},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.5225677},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.48756546},{"id":"https://openalex.org/keywords/graphics-processing-unit","display_name":"Graphics processing unit","score":0.47677165},{"id":"https://openalex.org/keywords/gpu-cluster","display_name":"GPU cluster","score":0.44608158}],"concepts":[{"id":"https://openalex.org/C97385483","wikidata":"https://www.wikidata.org/wiki/Q16954980","display_name":"Deep belief network","level":3,"score":0.860839},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8504052},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.85018486},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.63445127},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.625607},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.5585819},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5535835},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.5231344},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.5225677},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.50054145},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.48756546},{"id":"https://openalex.org/C2779851693","wikidata":"https://www.wikidata.org/wiki/Q183484","display_name":"Graphics processing unit","level":2,"score":0.47677165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44999045},{"id":"https://openalex.org/C2781335571","wikidata":"https://www.wikidata.org/wiki/Q2633544","display_name":"GPU cluster","level":3,"score":0.44608158},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.41561347},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.33059275},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2020745},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.19344541},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.097197056},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2015.7280511","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":19,"referenced_works":["https://openalex.org/W1528905581","https://openalex.org/W1973445088","https://openalex.org/W1992245639","https://openalex.org/W1993882792","https://openalex.org/W2005992036","https://openalex.org/W2019779527","https://openalex.org/W2038181916","https://openalex.org/W2072128103","https://openalex.org/W2108948681","https://openalex.org/W2116064496","https://openalex.org/W2120432001","https://openalex.org/W2141778357","https://openalex.org/W2166682639","https://openalex.org/W2914484425","https://openalex.org/W2951488730","https://openalex.org/W4231109964","https://openalex.org/W4238404964","https://openalex.org/W4301861531","https://openalex.org/W44815768"],"related_works":["https://openalex.org/W4317790246","https://openalex.org/W4211066045","https://openalex.org/W2992303576","https://openalex.org/W2598944200","https://openalex.org/W2559348759","https://openalex.org/W2346971659","https://openalex.org/W2163816448","https://openalex.org/W2057093945","https://openalex.org/W2056717482","https://openalex.org/W1936382095"],"abstract_inverted_index":{"A":[0],"deep":[1,10],"belief":[2],"network":[3],"(DBN)":[4],"is":[5,42,140],"an":[6,84],"important":[7],"branch":[8],"of":[9,36,38,58,62,77,137,144],"learning":[11,21],"models":[12],"and":[13,22,30,94,119,151],"has":[14],"been":[15],"successfully":[16],"applied":[17],"in":[18,40],"many":[19],"machine":[20],"pattern":[23],"recognition":[24],"fields":[25],"such":[26],"as":[27],"computer":[28],"vision":[29],"speech":[31],"recognition.":[32],"However,":[33],"the":[34,55,59,74,89,92,105,116,123,135,145,149,152,156],"training":[35],"billions":[37],"parameters":[39],"DBN":[41,86],"computationally":[43],"challenging":[44],"for":[45,64],"modern":[46],"central":[47],"processing":[48,66],"units":[49,67],"(CPUs).":[50],"Many":[51],"studies":[52,71],"have":[53,72],"reported":[54],"efficient":[56,85],"implementations":[57],"pre-training":[60,93,117],"process":[61,76,118],"DBNs":[63],"graphics":[65],"(GPUs),":[68],"but":[69],"few":[70],"mentioned":[73],"fine-tuning":[75,95,124],"DBNs.":[78],"In":[79],"this":[80],"paper,":[81],"we":[82],"describe":[83],"implementation":[87],"on":[88,104,115,122,148,155],"GPU,":[90],"including":[91],"processes.":[96],"Experimental":[97],"results":[98],"show":[99],"that":[100,143],"our":[101,138],"proposed":[102],"method":[103],"GPU":[106],"(NVIDIA":[107],"Tesla":[108],"K40c)":[109],"achieves":[110],"up":[111],"to":[112,142],"22":[113],"speedups":[114,121],"33":[120],"processes":[125],"compared":[126],"with":[127],"conventional":[128],"CPU":[129,150],"(Intel":[130],"Core":[131],"i7-4790K)":[132],"implementations.":[133],"Moreover,":[134],"performance":[136],"algorithm":[139],"superior":[141],"OpenBLAS":[146],"library":[147,154],"CUBLAS":[153],"GPU.":[157]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1632742330","counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":2}],"updated_date":"2025-04-22T13:02:20.410166","created_date":"2016-06-24"}