{"id":"https://openalex.org/W4416203785","doi":"https://doi.org/10.1145/3712285.3759779","title":"A Sample-Free Compilation Framework for Efficient Dynamic Tensor Computation","display_name":"A Sample-Free Compilation Framework for Efficient Dynamic Tensor Computation","publication_year":2025,"publication_date":"2025-11-12","ids":{"openalex":"https://openalex.org/W4416203785","doi":"https://doi.org/10.1145/3712285.3759779"},"language":null,"primary_location":{"id":"doi:10.1145/3712285.3759779","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712285.3759779","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3712285.3759779","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078261857","display_name":"Yangjie Zhou","orcid":"https://orcid.org/0000-0002-3652-5437"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]},{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN","SG"],"is_corresponding":true,"raw_author_name":"Yangjie Zhou","raw_affiliation_strings":["Tencent, Shenzhen, China and National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China and National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596","https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100297617","display_name":"Honglin Zhu","orcid":"https://orcid.org/0009-0009-1703-1691"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Honglin Zhu","raw_affiliation_strings":["Tencent, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111345725","display_name":"Qian Qiu","orcid":"https://orcid.org/0000-0002-5210-8166"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qian Qiu","raw_affiliation_strings":["Tencent, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008837660","display_name":"Weihao Cui","orcid":"https://orcid.org/0000-0002-6646-5260"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weihao Cui","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100623100","display_name":"Zihan Liu","orcid":"https://orcid.org/0000-0002-0874-0682"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zihan Liu","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China and Shanghai Qi Zhi Institute, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China and Shanghai Qi Zhi Institute, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100338479","display_name":"Peng Chen","orcid":"https://orcid.org/0000-0003-1244-3151"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Peng Chen","raw_affiliation_strings":["RIKEN Center for Computational Science, Kobe, Japan"],"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science, Kobe, Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002208999","display_name":"Mohamed Wahib","orcid":"https://orcid.org/0000-0002-7165-2095"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Mohamed Wahib","raw_affiliation_strings":["RIKEN Center for Computational Science, Kobe, Japan"],"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science, Kobe, Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101706991","display_name":"Cong Guo","orcid":"https://orcid.org/0000-0002-4479-5525"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Guo","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110303119","display_name":"S.M. Feng","orcid":"https://orcid.org/0000-0002-4682-983X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyuan Feng","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056275783","display_name":"Jintao Meng","orcid":"https://orcid.org/0000-0002-6208-4102"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jintao Meng","raw_affiliation_strings":["Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110799964","display_name":"Haidong Lan","orcid":"https://orcid.org/0000-0002-5231-4015"},"institutions":[{"id":"https://openalex.org/I105695857","display_name":"Siemens (Hungary)","ror":"https://ror.org/01rk7mv85","country_code":"HU","type":"company","lineage":["https://openalex.org/I105695857","https://openalex.org/I1325886976"]}],"countries":["HU"],"is_corresponding":false,"raw_author_name":"Haidong Lan","raw_affiliation_strings":["Taichi Graphics, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Taichi Graphics, Shenzhen, China","institution_ids":["https://openalex.org/I105695857"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003939279","display_name":"Jingwen Leng","orcid":"https://orcid.org/0000-0002-5660-5493"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingwen Leng","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China and Shanghai Qi Zhi Institute, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China and Shanghai Qi Zhi Institute, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063706766","display_name":"Yun Lin","orcid":"https://orcid.org/0000-0001-8255-0118"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Lin","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085067496","display_name":"Jin Song Dong","orcid":"https://orcid.org/0000-0002-6512-8326"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jin Song Dong","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101131384","display_name":"Wenxi Zhu","orcid":"https://orcid.org/0009-0001-4933-4672"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenxi Zhu","raw_affiliation_strings":["Tencent, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083508620","display_name":"Minwen Deng","orcid":"https://orcid.org/0009-0005-8122-3023"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minwen Deng","raw_affiliation_strings":["Tencent, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5078261857"],"corresponding_institution_ids":["https://openalex.org/I165932596","https://openalex.org/I2250653659"],"apc_list":null,"apc_paid":null,"fwci":4.3965,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.94978301,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"167","last_page":"184"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.6262000203132629,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.6262000203132629,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.03830000013113022,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.028200000524520874,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6455000042915344},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.640999972820282},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6097999811172485},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.4772999882698059},{"id":"https://openalex.org/keywords/x86","display_name":"x86","score":0.4593000113964081},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.4544000029563904},{"id":"https://openalex.org/keywords/dynamic-compilation","display_name":"Dynamic compilation","score":0.39469999074935913},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.38519999384880066}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.824999988079071},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6455000042915344},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.640999972820282},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6236000061035156},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6097999811172485},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.4772999882698059},{"id":"https://openalex.org/C170723468","wikidata":"https://www.wikidata.org/wiki/Q182933","display_name":"x86","level":3,"score":0.4593000113964081},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.4544000029563904},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.40220001339912415},{"id":"https://openalex.org/C8767382","wikidata":"https://www.wikidata.org/wiki/Q1058454","display_name":"Dynamic compilation","level":3,"score":0.39469999074935913},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.38519999384880066},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.3831999897956848},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3280999958515167},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.3188999891281128},{"id":"https://openalex.org/C190902152","wikidata":"https://www.wikidata.org/wiki/Q1325106","display_name":"Optimizing compiler","level":3,"score":0.31540000438690186},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.31349998712539673},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C200833197","wikidata":"https://www.wikidata.org/wiki/Q333707","display_name":"Compile time","level":3,"score":0.30239999294281006},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2955999970436096},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.27140000462532043},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2700999975204468},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C189930140","wikidata":"https://www.wikidata.org/wiki/Q1112878","display_name":"CAS latency","level":4,"score":0.25450000166893005},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.2535000145435333}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3712285.3759779","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712285.3759779","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3712285.3759779","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712285.3759779","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G142312583","display_name":null,"funder_award_id":"U21B2017, 62222210","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2899272573","display_name":null,"funder_award_id":"AISG2-GC-2023-008-1B","funder_id":"https://openalex.org/F4320320741","funder_display_name":"DSO National Laboratories - Singapore"},{"id":"https://openalex.org/G2973132691","display_name":null,"funder_award_id":"NCRP25-P04-TAICeN, A-8002767-00-00","funder_id":"https://openalex.org/F4320320709","funder_display_name":"National Research Foundation Singapore"}],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"},{"id":"https://openalex.org/F4320320741","display_name":"DSO National Laboratories - Singapore","ror":"https://ror.org/03e05fb06"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W182691100","https://openalex.org/W1536680647","https://openalex.org/W2073061372","https://openalex.org/W2097117768","https://openalex.org/W2194775991","https://openalex.org/W2907492528","https://openalex.org/W2919115771","https://openalex.org/W2963770578","https://openalex.org/W2981758446","https://openalex.org/W2983655274","https://openalex.org/W2985556357","https://openalex.org/W3004423738","https://openalex.org/W3012249773","https://openalex.org/W3035038672","https://openalex.org/W3158027451","https://openalex.org/W3158444059","https://openalex.org/W3174529902","https://openalex.org/W3204647170","https://openalex.org/W4212986322","https://openalex.org/W4251637954","https://openalex.org/W4300527111","https://openalex.org/W4318541535","https://openalex.org/W4318541538","https://openalex.org/W4360831828","https://openalex.org/W4381785750","https://openalex.org/W4385585374","https://openalex.org/W4388620366","https://openalex.org/W4394998528","https://openalex.org/W4403196715"],"related_works":[],"abstract_inverted_index":{"Dynamic-shape":[0],"tensor":[1,34,73],"computation":[2],"poses":[3],"challenges":[4],"for":[5],"shape-specific":[6,117],"compilation":[7,35,39,46,58,137],"due":[8],"to":[9,43,71,82],"variable":[10],"input":[11],"dimensions.":[12],"Existing":[13],"compilers":[14,145],"rely":[15],"on":[16,26,125],"shape":[17,53],"samples,":[18],"incurring":[19],"high":[20],"tuning":[21,118],"costs":[22],"and":[23,40,48,78,102,111,119,130,146,150,158],"performance":[24],"degradation":[25],"unseen":[27],"inputs.":[28],"We":[29],"present":[30],"Helix,":[31],"a":[32],"dynamic":[33],"framework":[36],"with":[37,75],"sample-free":[38],"architecture-guided":[41],"optimization":[42],"achieve":[44],"both":[45],"efficiency":[47],"shape-general":[49],"performance.":[50],"To":[51],"avoid":[52],"sampling,":[54],"Helix":[55,135],"constructs":[56],"shape-agnostic":[57],"by":[59,139],"decomposing":[60],"computations":[61,74],"across":[62],"architectural":[63,76,100],"layers.":[64],"A":[65,91],"bidirectional":[66],"strategy":[67],"combines":[68],"top-down":[69],"abstraction":[70],"align":[72],"hierarchies,":[77],"bottom-up":[79],"kernel":[80],"construction":[81],"build":[83],"efficient":[84],"execution":[85,153],"strategies":[86],"from":[87],"reusable,":[88],"architecture-aligned":[89],"micro-kernels.":[90],"hybrid":[92],"analyzer":[93],"ensures":[94],"accuracy":[95],"through":[96,105],"profiling":[97],"at":[98,108],"lower":[99],"levels,":[101],"achieves":[103],"scalability":[104],"architecture-informed":[106],"modeling":[107],"higher":[109],"levels":[110],"runtime.":[112],"This":[113],"hierarchical":[114],"design":[115],"eliminates":[116],"enables":[120],"shape-adaptive":[121],"execution.":[122],"Evaluations":[123],"conducted":[124],"x86":[126],"CPUs,":[127,129],"ARM":[128],"NVIDIA":[131],"GPUs":[132],"demonstrate":[133],"that":[134],"reduces":[136],"time":[138],"174":[140],"\u00d7":[141,149,152],"over":[142,155],"the":[143],"existing":[144],"delivers":[147],"2.26":[148],"3.29":[151],"speedups":[154],"vendor":[156],"libraries":[157],"dynamic-shape":[159],"compilers,":[160],"respectively.":[161]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-12T00:00:00"}
