{"id":"https://openalex.org/W4321636552","doi":"https://doi.org/10.1109/sc41404.2022.00074","title":"QoS-Aware Irregular Collaborative Inference for Improving Throughput of DNN Services","display_name":"QoS-Aware Irregular Collaborative Inference for Improving Throughput of DNN Services","publication_year":2022,"publication_date":"2022-11-01","ids":{"openalex":"https://openalex.org/W4321636552","doi":"https://doi.org/10.1109/sc41404.2022.00074"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/sc41404.2022.00074","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037447327","display_name":"Kaihua Fu","orcid":"https://orcid.org/0000-0001-5117-7162"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"funder","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaihua Fu","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020345102","display_name":"Jiuchen Shi","orcid":"https://orcid.org/0000-0002-5470-210X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"funder","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiuchen Shi","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100377840","display_name":"Quan Chen","orcid":"https://orcid.org/0000-0001-5832-0347"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"funder","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quan Chen","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018118687","display_name":"Ningxin Zheng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"funder","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ningxin Zheng","raw_affiliation_strings":["Microsoft Research Asia, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Shanghai, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100756628","display_name":"Wei Zhang","orcid":"https://orcid.org/0000-0001-5556-3896"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"funder","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077093242","display_name":"Deze Zeng","orcid":"https://orcid.org/0000-0003-3276-1202"},"institutions":[{"id":"https://openalex.org/I3124059619","display_name":"China University of Geosciences","ror":"https://ror.org/04gcegc37","country_code":"CN","type":"funder","lineage":["https://openalex.org/I3124059619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Deze Zeng","raw_affiliation_strings":["China University of Geosciences, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"China University of Geosciences, Wuhan, China","institution_ids":["https://openalex.org/I3124059619"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039318240","display_name":"Minyi Guo","orcid":"https://orcid.org/0000-0003-0034-2302"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"funder","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minyi Guo","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.843,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.374882,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":81,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9977,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9977,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10080","display_name":"Energy Efficient Wireless Sensor Networks","score":0.9952,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.45595717}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8042773},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.65760434},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.6189723},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.60279936},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.6025728},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46561956},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.45707685},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.45595717},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.44899386},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.42166415},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.4130572},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33831942},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.32518145},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16969389},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.15735066},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1459217},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C136264566","wikidata":"https://www.wikidata.org/wiki/Q159810","display_name":"Economy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/sc41404.2022.00074","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"61832006,62022057"}],"datasets":[],"versions":[],"referenced_works_count":33,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1981055536","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2394932179","https://openalex.org/W2577255746","https://openalex.org/W2605258629","https://openalex.org/W2607041014","https://openalex.org/W2734941459","https://openalex.org/W2798291715","https://openalex.org/W2892952080","https://openalex.org/W2896457183","https://openalex.org/W2926143647","https://openalex.org/W2931122162","https://openalex.org/W2982157693","https://openalex.org/W2984200518","https://openalex.org/W3005664618","https://openalex.org/W3038006402","https://openalex.org/W3083715619","https://openalex.org/W3105381414","https://openalex.org/W3130716829","https://openalex.org/W3133171930","https://openalex.org/W3153345798","https://openalex.org/W3158444059","https://openalex.org/W3208777667","https://openalex.org/W4200091031","https://openalex.org/W4200542591","https://openalex.org/W4214540558","https://openalex.org/W4280633999","https://openalex.org/W4282968244","https://openalex.org/W4286900001","https://openalex.org/W4293584584","https://openalex.org/W4297808460"],"related_works":["https://openalex.org/W4386004629","https://openalex.org/W4381489698","https://openalex.org/W4366999913","https://openalex.org/W4313339048","https://openalex.org/W4281678247","https://openalex.org/W3201779876","https://openalex.org/W3176734149","https://openalex.org/W3162668736","https://openalex.org/W3014007418","https://openalex.org/W3013760193"],"abstract_inverted_index":{"With":[0],"collaborative":[1,54],"DNN":[2],"inference,":[3],"part":[4],"of":[5,81,133],"queries":[6,32,82,96,102,115],"run":[7,27,116],"on":[8,28,33,84,104,121,138],"their":[9,105],"source":[10],"edge":[11],"device":[12],"to":[13,45,119],"reduce":[14],"latencies.":[15],"Because":[16],"edges":[17],"show":[18,36,125],"diverse":[19],"performance":[20,87],"and":[21,31,71,88,98],"network":[22,89],"conditions,":[23],"different":[24,29],"layers":[25],"should":[26],"devices,":[30],"the":[34,79,85,100,111,122,129,134,142],"datacenter":[35,135],"irregular":[37,48,61,95,101],"structures.":[38],"However,":[39],"emerging":[40],"schemes":[41],"are":[42],"not":[43],"able":[44],"process":[46],"such":[47],"queries.":[49,62],"We":[50],"propose":[51],"ICE,":[52],"a":[53,65,68,72],"inference":[55],"service":[56],"scheme":[57],"that":[58,126],"effectively":[59],"supports":[60],"ICE":[63,127],"comprises":[64],"query":[66,69,76,92],"slicer,":[67],"manager,":[70],"lag":[73,108],"enhancer.":[74],"The":[75,91,107],"slicer":[77],"maps":[78],"execution":[80],"based":[83,103],"edges'":[86],"conditions.":[90],"manager":[93],"batches":[94],"adaptively":[97],"schedules":[99],"progress.":[106],"enhancer":[109],"reduces":[110],"QoS":[112],"violation":[113],"when":[114],"slower":[117],"due":[118],"interference":[120],"edge.":[123],"Experiments":[124],"improves":[128],"supported":[130],"peak":[131],"load":[132],"by":[136],"43.2%":[137],"average":[139],"while":[140],"guaranteeing":[141],"required":[143],"99%-ile":[144],"latencies":[145],"compared":[146],"with":[147],"state-of-the-art":[148],"techniques.":[149]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4321636552","counts_by_year":[{"year":2023,"cited_by_count":5}],"updated_date":"2025-04-17T07:06:39.566685","created_date":"2023-02-24"}