{"id":"https://openalex.org/W4395073460","doi":"https://doi.org/10.1145/3620666.3651369","title":"EVT: Accelerating Deep Learning Training with Epilogue Visitor Tree","display_name":"EVT: Accelerating Deep Learning Training with Epilogue Visitor Tree","publication_year":2024,"publication_date":"2024-04-24","ids":{"openalex":"https://openalex.org/W4395073460","doi":"https://doi.org/10.1145/3620666.3651369"},"language":"en","primary_location":{"id":"doi:10.1145/3620666.3651369","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3620666.3651369","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3620666.3651369","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037216840","display_name":"Zhaodong Chen","orcid":"https://orcid.org/0000-0001-9601-4586"},"institutions":[{"id":"https://openalex.org/I154570441","display_name":"University of California, Santa Barbara","ror":"https://ror.org/02t274463","country_code":"US","type":"education","lineage":["https://openalex.org/I154570441"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhaodong Chen","raw_affiliation_strings":["University of California, Santa Barbara, Santa Barbara, United States of America"],"raw_orcid":"https://orcid.org/0000-0001-9601-4586","affiliations":[{"raw_affiliation_string":"University of California, Santa Barbara, Santa Barbara, United States of America","institution_ids":["https://openalex.org/I154570441"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102856962","display_name":"Andrew Kerr","orcid":"https://orcid.org/0009-0003-5708-0216"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Kerr","raw_affiliation_strings":["NVIDIA, Santa Clara, USA"],"raw_orcid":"https://orcid.org/0009-0003-5708-0216","affiliations":[{"raw_affiliation_string":"NVIDIA, Santa Clara, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065265831","display_name":"Richard Cai","orcid":"https://orcid.org/0009-0000-5645-6718"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Richard Cai","raw_affiliation_strings":["NVIDIA, Santa Clara, USA"],"raw_orcid":"https://orcid.org/0009-0000-5645-6718","affiliations":[{"raw_affiliation_string":"NVIDIA, Santa Clara, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034516607","display_name":"Jack Kosaian","orcid":"https://orcid.org/0000-0001-8812-7847"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jack Kosaian","raw_affiliation_strings":["NVIDIA, Santa Clara, USA"],"raw_orcid":"https://orcid.org/0000-0001-8812-7847","affiliations":[{"raw_affiliation_string":"NVIDIA, Santa Clara, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003741499","display_name":"Haicheng Wu","orcid":"https://orcid.org/0000-0003-0357-9049"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haicheng Wu","raw_affiliation_strings":["NVIDIA, Santa Clara, USA"],"raw_orcid":"https://orcid.org/0000-0003-0357-9049","affiliations":[{"raw_affiliation_string":"NVIDIA, Santa Clara, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048052285","display_name":"Yufei Ding","orcid":"https://orcid.org/0000-0002-8716-5793"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yufei Ding","raw_affiliation_strings":["University of California San Diego, San Diego, United States of America"],"raw_orcid":"https://orcid.org/0000-0002-8716-5793","affiliations":[{"raw_affiliation_string":"University of California San Diego, San Diego, United States of America","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100385336","display_name":"Yuan Xie","orcid":"https://orcid.org/0000-0003-2093-1788"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yuan Xie","raw_affiliation_strings":["The Hong Kong University of Science and Technology, HongKong, China"],"raw_orcid":"https://orcid.org/0000-0003-2093-1788","affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology, HongKong, China","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5037216840"],"corresponding_institution_ids":["https://openalex.org/I154570441"],"apc_list":null,"apc_paid":null,"fwci":0.7142,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.68973389,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"301","last_page":"316"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8026505708694458},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6863546371459961},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6533563137054443},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5560570359230042},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5397425889968872},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.4855911135673523},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4761514663696289},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.47029754519462585},{"id":"https://openalex.org/keywords/debugging","display_name":"Debugging","score":0.46201980113983154},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.43638676404953003},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.4309362471103668},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3892923593521118},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.37617185711860657},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3315662145614624},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.16234397888183594},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15995565056800842}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8026505708694458},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6863546371459961},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6533563137054443},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5560570359230042},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5397425889968872},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.4855911135673523},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4761514663696289},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.47029754519462585},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.46201980113983154},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.43638676404953003},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.4309362471103668},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3892923593521118},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37617185711860657},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3315662145614624},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.16234397888183594},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15995565056800842},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3620666.3651369","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3620666.3651369","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-147982","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-147982","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":{"id":"doi:10.1145/3620666.3651369","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3620666.3651369","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1836465849","https://openalex.org/W2049287714","https://openalex.org/W2138233678","https://openalex.org/W2142498761","https://openalex.org/W2161455936","https://openalex.org/W2194775991","https://openalex.org/W2519887557","https://openalex.org/W2595551253","https://openalex.org/W2728444714","https://openalex.org/W2739996966","https://openalex.org/W2804032941","https://openalex.org/W2811130204","https://openalex.org/W2896457183","https://openalex.org/W2914209329","https://openalex.org/W2949967139","https://openalex.org/W2954698171","https://openalex.org/W2970971581","https://openalex.org/W2999905431","https://openalex.org/W3004659153","https://openalex.org/W3035582633","https://openalex.org/W3132695675","https://openalex.org/W3208099998","https://openalex.org/W4253605282","https://openalex.org/W4321446237","https://openalex.org/W6681029592"],"related_works":["https://openalex.org/W3000097931","https://openalex.org/W2354322770","https://openalex.org/W4321442002","https://openalex.org/W4237547500","https://openalex.org/W1570848052","https://openalex.org/W2373192430","https://openalex.org/W2015265939","https://openalex.org/W2284072287","https://openalex.org/W4239268388","https://openalex.org/W2611067230"],"abstract_inverted_index":{"As":[0],"deep":[1,8],"learning":[2,9],"models":[3],"become":[4],"increasingly":[5],"complex,":[6],"the":[7,15,40,65],"compilers":[10,33,89],"are":[11],"critical":[12],"for":[13,83],"enhancing":[14],"system":[16],"efficiency":[17],"and":[18,55,72,80],"unlocking":[19],"hidden":[20],"optimization":[21,59],"opportunities.":[22],"Although":[23],"excellent":[24],"speedups":[25],"have":[26],"been":[27],"achieved":[28],"in":[29,37,77],"inference":[30],"workloads,":[31],"existing":[32,88],"face":[34],"significant":[35],"limitations":[36],"training.":[38],"Firstly,":[39],"training":[41,66],"computation":[42],"graph":[43],"involves":[44],"intricate":[45],"operations":[46],"challenging":[47],"to":[48],"fuse,":[49],"such":[50],"as":[51],"normalization,":[52],"loss":[53],"functions,":[54],"reductions,":[56],"which":[57],"limit":[58],"opportunities":[60],"like":[61],"kernel":[62,84],"fusion.":[63,85],"Secondly,":[64],"graph's":[67],"additional":[68],"edges":[69],"connecting":[70],"forward":[71],"backward":[73],"operators":[74],"pose":[75],"challenges":[76],"finding":[78],"optimal":[79],"feasible":[81],"partitions":[82],"More":[86],"importantly,":[87],"cannot":[90],"either":[91],"generate":[92],"kernels":[93],"with":[94],"state-of-the-art":[95],"performance":[96],"on":[97],"modern":[98],"GPUs":[99],"or":[100],"accommodate":[101],"diverse":[102],"fusion":[103],"patterns.":[104]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
