{"id":"https://openalex.org/W7131377983","doi":"https://doi.org/10.48550/arxiv.2602.19762","title":"Hexagon-MLIR: An AI Compilation Stack For Qualcomm's Neural Processing Units (NPUs)","display_name":"Hexagon-MLIR: An AI Compilation Stack For Qualcomm's Neural Processing Units (NPUs)","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131377983","doi":"https://doi.org/10.48550/arxiv.2602.19762"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.19762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.19762","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080005521","display_name":"Mohammed Javed Absar","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Absar, Mohammed Javed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104040289","display_name":"Muthu Manikandan Baskaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baskaran, Muthu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126672823","display_name":"Abhikrant Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Abhikrant","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003819598","display_name":"Abhilash Bhandari","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhandari, Abhilash","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126726992","display_name":"Ankit Aggarwal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aggarwal, Ankit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011358174","display_name":"Arun Rangasamy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rangasamy, Arun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126793480","display_name":"Dibyendu Das","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Das, Dibyendu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069422613","display_name":"Fateme S. Hosseini","orcid":"https://orcid.org/0000-0002-9091-3908"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hosseini, Fateme","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034883170","display_name":"Franck Slama","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Slama, Franck","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014379085","display_name":"Iulian Brumar","orcid":"https://orcid.org/0000-0003-0403-856X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brumar, Iulian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126736325","display_name":"Jyotsna Verma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Verma, Jyotsna","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126727978","display_name":"Krishnaprasad Bindumadhavan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bindumadhavan, Krishnaprasad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043574439","display_name":"Mitesh Kothari","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kothari, Mitesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126793476","display_name":"Mohit Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Mohit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126691833","display_name":"Ravishankar Kolachana","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kolachana, Ravishankar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108503417","display_name":"Richard Lethin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lethin, Richard","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116182780","display_name":"Samarth Narang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Narang, Samarth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013435163","display_name":"Sanjay Motilal Ladwa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ladwa, Sanjay Motilal","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007339313","display_name":"Shalini Jain","orcid":"https://orcid.org/0000-0001-6965-4967"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jain, Shalini","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126712661","display_name":"Snigdha Suresh Dalvi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dalvi, Snigdha Suresh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126673941","display_name":"Tasmia Rahman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahman, Tasmia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126713814","display_name":"Venkat Rasagna Reddy Komatireddy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Komatireddy, Venkat Rasagna Reddy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126738646","display_name":"Vivek Vasudevbhai Pandya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pandya, Vivek Vasudevbhai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126727500","display_name":"Xiyue Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Xiyue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028706797","display_name":"Zachary Zipper","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zipper, Zachary","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":25,"corresponding_author_ids":["https://openalex.org/A5080005521"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.3781999945640564,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.3781999945640564,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.29490000009536743,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.022700000554323196,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.7055000066757202},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.6039999723434448},{"id":"https://openalex.org/keywords/stack","display_name":"Stack (abstract data type)","score":0.5764999985694885},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5644000172615051},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.47609999775886536},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.45809999108314514},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4081000089645386},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.4025999903678894}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8528000116348267},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.7055000066757202},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.6039999723434448},{"id":"https://openalex.org/C9395851","wikidata":"https://www.wikidata.org/wiki/Q177929","display_name":"Stack (abstract data type)","level":2,"score":0.5764999985694885},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5644000172615051},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.47609999775886536},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4595000147819519},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.45809999108314514},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4081000089645386},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.4025999903678894},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.37630000710487366},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.35589998960494995},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.35010001063346863},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.34040001034736633},{"id":"https://openalex.org/C200833197","wikidata":"https://www.wikidata.org/wiki/Q333707","display_name":"Compile time","level":3,"score":0.32749998569488525},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3221000134944916},{"id":"https://openalex.org/C27602214","wikidata":"https://www.wikidata.org/wiki/Q1868547","display_name":"Locality of reference","level":3,"score":0.3203999996185303},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30889999866485596},{"id":"https://openalex.org/C119024030","wikidata":"https://www.wikidata.org/wiki/Q759899","display_name":"Call stack","level":3,"score":0.2994000017642975},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.29840001463890076},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.2816999852657318},{"id":"https://openalex.org/C157170001","wikidata":"https://www.wikidata.org/wiki/Q4781507","display_name":"Applications of artificial intelligence","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2644999921321869}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.19762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.19762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.4718742072582245}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1,148],"paper,":[2],"we":[3,80,137],"present":[4],"Hexagon-MLIR,an":[5],"open-source":[6,113],"compilation":[7,71,115,125],"stack":[8,116],"that":[9,83,117],"targets":[10],"Qualcomm":[11],"Hexagon":[12],"Neural":[13],"Processing":[14],"Unit":[15],"(NPU)":[16],"and":[17,25,136,145],"provides":[18],"unified":[19],"support":[20],"for":[21,65],"lowering":[22],"Triton":[23,57,78],"kernels":[24,58],"PyTorch":[26,63],"models":[27],".":[28],"Built":[29],"using":[30],"the":[31,88,95],"MLIR":[32],"framework,":[33],"our":[34,66,105],"compiler":[35],"applies":[36],"a":[37,120,128,134],"structured":[38],"sequence":[39],"of":[40,55],"passes":[41],"to":[42,47,74,122,140],"exploit":[43],"NPU":[44],"architectural":[45],"features":[46],"accelerate":[48],"AI":[49,124],"workloads.":[50],"It":[51],"enables":[52],"faster":[53],"deployment":[54],"new":[56],"(hand-written":[59],"or":[60],"subgraphs":[61],"from":[62,72],"2.0),":[64],"target":[67],"by":[68,108],"providing":[69,109],"automated":[70],"kernel":[73],"binary.":[75],"By":[76],"ingesting":[77],"kernels,":[79],"generate":[81],"mega-kernels":[82],"maximize":[84],"data":[85],"locality":[86],"in":[87,99,147],"NPU's":[89],"Tightly":[90],"Coupled":[91],"Memory":[92],"(TCM),":[93],"reducing":[94],"bandwidth":[96],"bottlenecks":[97],"inherent":[98],"library-based":[100],"approaches.":[101],"This":[102],"initiative":[103],"complements":[104],"commercial":[106],"toolchains":[107],"developers":[110],"with":[111],"an":[112],"MLIR-based":[114],"gives":[118],"them":[119],"path":[121],"advance":[123],"capabilities":[126,146],"through":[127],"more":[129,143],"flexible":[130],"approach.":[131],"Hexagon-MLIR":[132],"is":[133],"work-in-progress,":[135],"are":[138],"continuing":[139],"add":[141],"many":[142],"optimizations":[144],"effort.":[149]},"counts_by_year":[],"updated_date":"2026-02-26T06:34:08.959763","created_date":"2026-02-26T00:00:00"}
