{"id":"https://openalex.org/W4413014925","doi":"https://doi.org/10.1145/3676642.3736127","title":"DeepContext: A Context-aware, Cross-platform, and Cross-framework Tool for Performance Profiling and Analysis of Deep Learning Workloads","display_name":"DeepContext: A Context-aware, Cross-platform, and Cross-framework Tool for Performance Profiling and Analysis of Deep Learning Workloads","publication_year":2025,"publication_date":"2025-08-06","ids":{"openalex":"https://openalex.org/W4413014925","doi":"https://doi.org/10.1145/3676642.3736127"},"language":"en","primary_location":{"id":"doi:10.1145/3676642.3736127","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3676642.3736127","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3676642.3736127","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3676642.3736127","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101844131","display_name":"Qidong Zhao","orcid":"https://orcid.org/0000-0002-0872-1246"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Qidong Zhao","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109756842","display_name":"Hao Wu","orcid":"https://orcid.org/0009-0003-6318-4505"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hao Wu","raw_affiliation_strings":["George Mason University, Fairfax, VA, USA"],"affiliations":[{"raw_affiliation_string":"George Mason University, Fairfax, VA, USA","institution_ids":["https://openalex.org/I162714631"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015357791","display_name":"Yueming Hao","orcid":"https://orcid.org/0000-0002-4792-6244"},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yueming Hao","raw_affiliation_strings":["Meta, Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta, Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zilingfeng Ye","orcid":"https://orcid.org/0009-0003-5437-0445"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zilingfeng Ye","raw_affiliation_strings":["Independent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Independent, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100454305","display_name":"Jiajia Li","orcid":"https://orcid.org/0000-0003-1270-4147"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiajia Li","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013392225","display_name":"Xu Liu","orcid":"https://orcid.org/0000-0002-1487-963X"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xu Liu","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063326523","display_name":"Keren Zhou","orcid":"https://orcid.org/0000-0002-7977-3182"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Keren Zhou","raw_affiliation_strings":["George Mason University, Fairfax, VA, USA"],"affiliations":[{"raw_affiliation_string":"George Mason University, Fairfax, VA, USA","institution_ids":["https://openalex.org/I162714631"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101844131"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":null,"apc_paid":null,"fwci":1.4196,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.85026865,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"48","last_page":"63"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.8849373459815979},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7665749788284302},{"id":"https://openalex.org/keywords/cross-platform","display_name":"Cross-platform","score":0.4648318290710449},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.432547390460968},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4190787971019745},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.35301142930984497},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3404988944530487},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.19781872630119324}],"concepts":[{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.8849373459815979},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7665749788284302},{"id":"https://openalex.org/C92400490","wikidata":"https://www.wikidata.org/wiki/Q174666","display_name":"Cross-platform","level":2,"score":0.4648318290710449},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.432547390460968},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4190787971019745},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.35301142930984497},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3404988944530487},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.19781872630119324},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3676642.3736127","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3676642.3736127","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3676642.3736127","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3676642.3736127","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3676642.3736127","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3676642.3736127","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4126240652","display_name":null,"funder_award_id":"2411134","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"}],"funders":[{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4413014925.pdf"},"referenced_works_count":15,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2108598243","https://openalex.org/W2136434791","https://openalex.org/W2194775991","https://openalex.org/W2337381441","https://openalex.org/W2760656271","https://openalex.org/W3049119995","https://openalex.org/W3101330584","https://openalex.org/W3127495619","https://openalex.org/W3130647239","https://openalex.org/W3199133416","https://openalex.org/W3200843682","https://openalex.org/W4283024785","https://openalex.org/W4390872297","https://openalex.org/W4394998532"],"related_works":["https://openalex.org/W4375867731","https://openalex.org/W2161444195","https://openalex.org/W2985540061","https://openalex.org/W2589019771","https://openalex.org/W2185012154","https://openalex.org/W4252521128","https://openalex.org/W2104014222","https://openalex.org/W4287867321","https://openalex.org/W4404404018","https://openalex.org/W4413014925"],"abstract_inverted_index":{"Effective":[0],"performance":[1,70,77,122,137],"optimization":[2,82],"of":[3,63,89,94],"deep":[4,44,65,95,102],"learning":[5,45,66,96,103],"models":[6],"requires":[7],"comprehensive":[8],"profiling":[9,35],"across":[10,41],"heterogeneous":[11],"computing":[12],"environments,":[13],"yet":[14],"existing":[15],"tools":[16],"fail":[17],"to":[18,134],"bridge":[19],"the":[20,61,64,90],"semantic":[21],"gap":[22],"between":[23,141],"high-level":[24],"operations":[25],"and":[26,49,105,143],"low-level":[27],"execution.":[28,51],"This":[29],"paper":[30],"presents":[31],"DeepContext,":[32,130],"a":[33,54],"novel":[34],"system":[36],"that":[37,58,79,117],"correlates":[38,60],"program":[39],"contexts":[40],"Python":[42],"code,":[43],"frameworks,":[46],"C/C++":[47],"libraries,":[48],"GPU":[50],"DeepContext":[52,73,98,118],"features":[53],"framework-agnostic":[55],"shim":[56],"layer":[57],"seamlessly":[59],"behavior":[62],"framework":[67],"with":[68,111],"hardware":[69],"metrics.":[71],"Furthermore,":[72],"provides":[74],"an":[75],"automated":[76],"analyzer":[78],"offers":[80],"actionable":[81],"guidance":[83],"based":[84],"on":[85,107],"its":[86],"holistic":[87],"view":[88],"entire":[91],"software":[92],"stack":[93],"applications.":[97,127],"works":[99],"for":[100],"mainstream":[101],"frameworks":[104],"runs":[106],"modern":[108],"CPU+GPU":[109],"architectures":[110],"low":[112],"overhead.":[113],"Our":[114],"evaluation":[115],"demonstrates":[116],"uncovers":[119],"previously":[120],"hidden":[121],"bottlenecks":[123],"in":[124],"real-world":[125],"deep-learning":[126],"Guided":[128],"by":[129],"we":[131],"are":[132],"able":[133],"fix":[135],"multiple":[136],"issues,":[138],"achieving":[139],"speed-ups":[140],"1.06\u00d7":[142],"1.66\u00d7.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
