{"id":"https://openalex.org/W4404404018","doi":"https://doi.org/10.48550/arxiv.2411.02797","title":"DeepContext: A Context-aware, Cross-platform, and Cross-framework Tool\n for Performance Profiling and Analysis of Deep Learning Workloads","display_name":"DeepContext: A Context-aware, Cross-platform, and Cross-framework Tool\n for Performance Profiling and Analysis of Deep Learning Workloads","publication_year":2024,"publication_date":"2024-11-04","ids":{"openalex":"https://openalex.org/W4404404018","doi":"https://doi.org/10.48550/arxiv.2411.02797"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.02797","pdf_url":"http://arxiv.org/pdf/2411.02797","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2411.02797","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080460539","display_name":"Qidong Zhao","orcid":"https://orcid.org/0000-0001-9123-343X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Qidong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115590135","display_name":"Hao Wu","orcid":"https://orcid.org/0000-0002-6638-169X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100750974","display_name":"Yue Hao","orcid":"https://orcid.org/0000-0002-8081-2919"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao, Yuming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015949578","display_name":"Z. Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Zilingfeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108050242","display_name":"Jiajia Li","orcid":"https://orcid.org/0000-0001-6743-2797"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jiajia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013747807","display_name":"Xu Liu","orcid":"https://orcid.org/0000-0001-5177-9948"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5063326523","display_name":"Keren Zhou","orcid":"https://orcid.org/0000-0002-7977-3182"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Keren","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":83},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.984,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.984,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9687,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.9012,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.87965286},{"id":"https://openalex.org/keywords/cross-platform","display_name":"Cross-platform","score":0.6894028},{"id":"https://openalex.org/keywords/cross-validation","display_name":"Cross-validation","score":0.5150542}],"concepts":[{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.87965286},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7168853},{"id":"https://openalex.org/C92400490","wikidata":"https://www.wikidata.org/wiki/Q174666","display_name":"Cross-platform","level":2,"score":0.6894028},{"id":"https://openalex.org/C27181475","wikidata":"https://www.wikidata.org/wiki/Q541014","display_name":"Cross-validation","level":2,"score":0.5150542},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5143188},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4225926},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3891815},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.17679164},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.04728353},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.02797","pdf_url":"http://arxiv.org/pdf/2411.02797","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.02797","pdf_url":"http://arxiv.org/pdf/2411.02797","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W816105089","https://openalex.org/W4387664169","https://openalex.org/W4375867731","https://openalex.org/W4252521128","https://openalex.org/W4231960479","https://openalex.org/W2985540061","https://openalex.org/W2589019771","https://openalex.org/W2185012154","https://openalex.org/W2161444195","https://openalex.org/W1987563485"],"abstract_inverted_index":{"Effective":[0],"performance":[1,39,88,138,148,167],"profiling":[2],"and":[3,10,38,47,86,98,100,108,118,134,150,165,172],"analysis":[4],"are":[5],"essential":[6],"for":[7,42,90,187],"optimizing":[8],"training":[9],"inference":[11],"of":[12,21,83,175],"deep":[13,64,92,176,193],"learning":[14,65,93,177,194],"models,":[15],"especially":[16],"given":[17],"the":[18,30],"growing":[19],"complexity":[20],"heterogeneous":[22],"computing":[23],"environments.":[24,199],"However,":[25],"existing":[26],"tools":[27],"often":[28],"lack":[29],"capability":[31],"to":[32,130,169,190],"provide":[33],"comprehensive":[34],"program":[35,58,151],"context":[36],"information":[37],"optimization":[40,174],"insights":[41],"sophisticated":[43],"interactions":[44],"between":[45],"CPUs":[46],"GPUs.":[48,79],"This":[49],"paper":[50],"introduces":[51],"DeepContext,":[52],"a":[53,124,184],"novel":[54,125],"profiler":[55],"that":[56,127,140],"links":[57],"contexts":[59],"across":[60,196],"high-level":[61],"Python":[62],"code,":[63],"frameworks,":[66,94],"underlying":[67],"libraries":[68],"written":[69],"in":[70],"C/C++,":[71],"as":[72,74,96,110,112],"well":[73,111],"device":[75],"code":[76],"executed":[77],"on":[78,147],"DeepContext":[80,122,160],"incorporates":[81],"measurements":[82],"both":[84,106],"coarse-":[85],"fine-grained":[87],"metrics":[89,149],"major":[91],"such":[95],"PyTorch":[97],"JAX,":[99],"is":[101,183],"compatible":[102],"with":[103,143],"GPUs":[104],"from":[105],"Nvidia":[107],"AMD,":[109],"various":[113],"CPU":[114],"architectures,":[115],"including":[116],"x86":[117],"ARM.":[119],"In":[120],"addition,":[121],"integrates":[123],"GUI":[126],"allows":[128],"users":[129,142,163,188],"quickly":[131],"identify":[132,164],"hotpots":[133],"an":[135],"innovative":[136],"automated":[137],"analyzer":[139],"suggests":[141],"potential":[144],"optimizations":[145],"based":[146],"context.":[152],"Through":[153],"detailed":[154],"use":[155],"cases,":[156],"we":[157],"demonstrate":[158],"how":[159],"can":[161],"help":[162],"analyze":[166],"issues":[168],"enable":[170],"quick":[171],"effective":[173],"workloads.":[178],"We":[179],"believe":[180],"Deep":[181],"Context":[182],"valuable":[185],"tool":[186],"seeking":[189],"optimize":[191],"complex":[192],"workflows":[195],"multiple":[197],"compute":[198]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4404404018","counts_by_year":[],"updated_date":"2025-01-18T23:31:59.289243","created_date":"2024-11-16"}