{"id":"https://openalex.org/W4394951281","doi":"https://doi.org/10.1109/tpds.2024.3391254","title":"Efficient Utilization of Multi-Threading Parallelism on Heterogeneous Systems for Sparse Tensor Contraction","display_name":"Efficient Utilization of Multi-Threading Parallelism on Heterogeneous Systems for Sparse Tensor Contraction","publication_year":2024,"publication_date":"2024-04-19","ids":{"openalex":"https://openalex.org/W4394951281","doi":"https://doi.org/10.1109/tpds.2024.3391254"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2024.3391254","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107094004","display_name":"Guoqing Xiao","orcid":"https://orcid.org/0000-0001-5008-4829"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"funder","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"funder","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guoqing Xiao","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","Shenzhen Institute, Hunan University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute, Hunan University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I16609230"]},{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051624512","display_name":"Chuanghui Yin","orcid":null},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"funder","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuanghui Yin","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035942362","display_name":"Yuedan Chen","orcid":"https://orcid.org/0000-0001-5665-268X"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"funder","lineage":["https://openalex.org/I139660479"]},{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"funder","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"funder","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuedan Chen","raw_affiliation_strings":["Big Data Institute, Central South University, Changsha, China","Shenzhen Institute, Hunan University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Big Data Institute, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]},{"raw_affiliation_string":"Shenzhen Institute, Hunan University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090246160","display_name":"Mingxing Duan","orcid":"https://orcid.org/0000-0002-1049-6244"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"funder","lineage":["https://openalex.org/I16609230"]},{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"funder","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingxing Duan","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","Shenzhen Institute, Hunan University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"Shenzhen Institute, Hunan University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I16609230"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078793726","display_name":"Kenli Li","orcid":"https://orcid.org/0000-0002-2635-7716"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"funder","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kenli Li","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.012,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.996599,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":88,"max":92},"biblio":{"volume":"35","issue":"6","first_page":"1044","last_page":"1055"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9941,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/threading","display_name":"Threading (protein sequence)","score":0.5532585}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7621899},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6583117},{"id":"https://openalex.org/C163415756","wikidata":"https://www.wikidata.org/wiki/Q126473","display_name":"Contraction (grammar)","level":2,"score":0.5951475},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5617119},{"id":"https://openalex.org/C200307862","wikidata":"https://www.wikidata.org/wiki/Q7797175","display_name":"Threading (protein sequence)","level":3,"score":0.5532585},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.48784566},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.4239934},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.41668212},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.4133213},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.31564245},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.13069248},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.0},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C46141821","wikidata":"https://www.wikidata.org/wiki/Q209402","display_name":"Nuclear magnetic resonance","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2024.3391254","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":44,"referenced_works":["https://openalex.org/W1511885491","https://openalex.org/W1993079359","https://openalex.org/W2006973305","https://openalex.org/W2034669281","https://openalex.org/W2038198231","https://openalex.org/W2054658678","https://openalex.org/W2061014792","https://openalex.org/W2089196182","https://openalex.org/W2089349245","https://openalex.org/W2103392911","https://openalex.org/W2108138101","https://openalex.org/W2127226421","https://openalex.org/W2143119605","https://openalex.org/W2234552091","https://openalex.org/W2411765360","https://openalex.org/W2444009674","https://openalex.org/W2544822491","https://openalex.org/W2582107166","https://openalex.org/W2592422147","https://openalex.org/W2731053425","https://openalex.org/W2788854599","https://openalex.org/W2802696077","https://openalex.org/W2891431244","https://openalex.org/W2893530532","https://openalex.org/W2902783593","https://openalex.org/W2971508019","https://openalex.org/W2979740536","https://openalex.org/W2985039650","https://openalex.org/W2986686333","https://openalex.org/W2990601900","https://openalex.org/W2999353654","https://openalex.org/W3003516456","https://openalex.org/W3016735325","https://openalex.org/W3020586295","https://openalex.org/W3022452999","https://openalex.org/W3036899338","https://openalex.org/W3037114422","https://openalex.org/W3093682587","https://openalex.org/W3101321165","https://openalex.org/W3104098743","https://openalex.org/W3131379896","https://openalex.org/W3170905359","https://openalex.org/W4248445937","https://openalex.org/W4287254515"],"related_works":["https://openalex.org/W4400094300","https://openalex.org/W3214280620","https://openalex.org/W3191490922","https://openalex.org/W2794038527","https://openalex.org/W2765823764","https://openalex.org/W2384867379","https://openalex.org/W2329539859","https://openalex.org/W2327638088","https://openalex.org/W2227905990","https://openalex.org/W1554180614"],"abstract_inverted_index":{"Many":[0],"fields":[1],"of":[2,20,39,96,155],"scientific":[3],"simulation,":[4],"such":[5],"as":[6],"chemistry":[7],"and":[8,42,76,91,110,139],"condensed":[9],"matter":[10],"physics,":[11],"are":[12],"increasingly":[13],"eschewing":[14],"dense":[15],"tensor":[16,22,32,72,121],"contraction":[17,33,108,122],"in":[18,119],"favor":[19],"sparse":[21,31,120],"contraction.":[23,73],"In":[24,98],"this":[25],"work,":[26],"we":[27,48,82],"center":[28],"around":[29],"binary":[30],"(SpTC)":[34],"which":[35,113],"has":[36],"the":[37,86,93,107,116,132,137,140,159],"challenges":[38],"index":[40],"matching":[41],"accumulation.":[43],"To":[44],"address":[45],"these":[46],"difficulties,":[47],"present":[49],"GSpTC,":[50],"an":[51,151],"efficient":[52],"element-":[53,70],"wise":[54,71],"SpTC":[55],"framework":[56,162],"on":[57,69,89,104],"CPU-GPU":[58],"heterogeneous":[59],"systems.":[60],"GSpTC":[61,100,125,149],"first":[62],"introduces":[63],"a":[64,147],"fine-grained":[65],"partitioning":[66,80],"strategy":[67],"based":[68],"By":[74],"analyzing":[75],"selecting":[77],"appropriate":[78],"dimension":[79],"strategies,":[81],"can":[83],"efficiently":[84],"utilize":[85],"multi-threading":[87,102],"parallelism":[88,103],"GPUs":[90,105],"optimize":[92],"overall":[94],"performance":[95,153],"GSpTC.":[97],"particular,":[99],"leverages":[101],"for":[106],"phase":[109,118],"merging":[111],"phase,":[112],"greatly":[114],"accelerates":[115],"computation":[117],"computations.":[123],"Furthermore,":[124],"employs":[126],"parallel":[127],"pipeline":[128],"technology":[129],"to":[130,158],"hide":[131],"data":[133],"transmission":[134],"time":[135],"between":[136],"host":[138],"device,":[141],"further":[142],"enhancing":[143],"its":[144],"performance.":[145],"As":[146],"result,":[148],"achieves":[150],"average":[152],"improvement":[154],"267%":[156],"compared":[157],"previous":[160],"state-of-the-art":[161],"Sparta.":[163]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4394951281","counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-04-22T20:10:42.810010","created_date":"2024-04-20"}