{"id":"https://openalex.org/W4399282189","doi":"https://doi.org/10.1145/3650200.3656631","title":"Fasor: A Fast Tensor Program Optimization Framework for Efficient DNN Deployment","display_name":"Fasor: A Fast Tensor Program Optimization Framework for Efficient DNN Deployment","publication_year":2024,"publication_date":"2024-05-30","ids":{"openalex":"https://openalex.org/W4399282189","doi":"https://doi.org/10.1145/3650200.3656631"},"language":"en","primary_location":{"id":"doi:10.1145/3650200.3656631","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3650200.3656631","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656631","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th ACM International Conference on Supercomputing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656631","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064549619","display_name":"Hanxian Huang","orcid":"https://orcid.org/0000-0001-6338-3289"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hanxian Huang","raw_affiliation_strings":["University of California San Diego, USA"],"raw_orcid":"https://orcid.org/0000-0001-6338-3289","affiliations":[{"raw_affiliation_string":"University of California San Diego, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100363116","display_name":"Xin Chen","orcid":"https://orcid.org/0000-0003-1950-2468"},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Chen","raw_affiliation_strings":["Intel, USA"],"raw_orcid":"https://orcid.org/0000-0003-1950-2468","affiliations":[{"raw_affiliation_string":"Intel, USA","institution_ids":["https://openalex.org/I1343180700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5095044690","display_name":"Jishen Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jishen Zhao","raw_affiliation_strings":["University of California San Diego, United States of America"],"raw_orcid":"https://orcid.org/0000-0002-8766-0946","affiliations":[{"raw_affiliation_string":"University of California San Diego, United States of America","institution_ids":["https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5064549619"],"corresponding_institution_ids":["https://openalex.org/I36258959"],"apc_list":null,"apc_paid":null,"fwci":1.4231,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.80423149,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"498","last_page":"510"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.982200026512146,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7473055720329285},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.7129940390586853},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.7122964859008789},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5887163877487183},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.44249674677848816},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4396214187145233},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4287060797214508},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3529099225997925},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3399754762649536},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27587229013442993},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.13781824707984924},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13349395990371704},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.13224759697914124}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7473055720329285},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.7129940390586853},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.7122964859008789},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5887163877487183},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.44249674677848816},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4396214187145233},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4287060797214508},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3529099225997925},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3399754762649536},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27587229013442993},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.13781824707984924},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13349395990371704},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.13224759697914124},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3650200.3656631","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3650200.3656631","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656631","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th ACM International Conference on Supercomputing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3650200.3656631","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3650200.3656631","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3650200.3656631","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th ACM International Conference on Supercomputing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4399282189.pdf"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1971106787","https://openalex.org/W2002555321","https://openalex.org/W2013062050","https://openalex.org/W2077143534","https://openalex.org/W2123162799","https://openalex.org/W2172654076","https://openalex.org/W2194775991","https://openalex.org/W2809409253","https://openalex.org/W2905135312","https://openalex.org/W2905872298","https://openalex.org/W2912500072","https://openalex.org/W2961619211","https://openalex.org/W2963163009","https://openalex.org/W2963918968","https://openalex.org/W2970971581","https://openalex.org/W2981985696","https://openalex.org/W3008788679","https://openalex.org/W3011411500","https://openalex.org/W3012249773","https://openalex.org/W3035582633","https://openalex.org/W3138578552","https://openalex.org/W3157020554","https://openalex.org/W3200687135","https://openalex.org/W3211053593","https://openalex.org/W4221062244","https://openalex.org/W4251637954","https://openalex.org/W4318256790","https://openalex.org/W4318541553","https://openalex.org/W4320519434","https://openalex.org/W4327930463","https://openalex.org/W4390672384","https://openalex.org/W6713134421"],"related_works":["https://openalex.org/W2770234245","https://openalex.org/W96612179","https://openalex.org/W4229499248","https://openalex.org/W2566006169","https://openalex.org/W1567818861","https://openalex.org/W2987774938","https://openalex.org/W4256492088","https://openalex.org/W632915154","https://openalex.org/W2055733372","https://openalex.org/W3022067003"],"abstract_inverted_index":{"With":[0],"the":[1,17,52,70,85],"growing":[2],"importance":[3],"of":[4,21,55,61,72,87],"deploying":[5],"deep":[6],"neural":[7],"networks":[8],"(DNNs),":[9],"there":[10,79],"are":[11],"increasing":[12],"demands":[13],"to":[14,41,51],"improve":[15],"both":[16],"efficiency":[18,86],"and":[19,48,57],"quality":[20,71],"tensor":[22,36,77,91],"program":[23,31,37],"optimization":[24,95],"(TPO).":[25],"TPO":[26,45],"involves":[27],"searching":[28],"for":[29,33],"possible":[30],"transformations":[32,56],"a":[34],"given":[35],"on":[38,69,84],"target":[39],"hardware":[40],"optimize":[42],"its":[43],"execution.":[44],"is":[46],"challenging":[47],"expensive":[49],"due":[50],"exponential":[53],"combinations":[54],"time-consuming":[58],"on-device":[59],"measurement":[60],"transformations.":[62],"While":[63],"prior":[64],"research":[65],"has":[66,80],"primarily":[67],"focused":[68],"TPO,":[73,88],"i.e.,":[74,89],"generating":[75],"high-performance":[76],"programs,":[78],"been":[81],"less":[82],"emphasis":[83],"optimizing":[90],"programs":[92],"with":[93],"low":[94],"time":[96],"overhead.":[97]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
