{"id":"https://openalex.org/W7150837152","doi":"https://doi.org/10.48550/arxiv.2604.02525","title":"AdaHOP: Fast and Accurate Low-Precision Training via Outlier-Pattern-Aware Rotation","display_name":"AdaHOP: Fast and Accurate Low-Precision Training via Outlier-Pattern-Aware Rotation","publication_year":2026,"publication_date":"2026-04-02","ids":{"openalex":"https://openalex.org/W7150837152","doi":"https://doi.org/10.48550/arxiv.2604.02525"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.02525","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02525","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.02525","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111156777","display_name":"Seonggon Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Seonggon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082105097","display_name":"Alireza Khodamoradi","orcid":"https://orcid.org/0000-0001-8811-2258"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khodamoradi, Alireza","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035560671","display_name":"Kristof Denolf","orcid":"https://orcid.org/0000-0001-6668-4562"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vasireddy, Pranathi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064884832","display_name":"Eunhyeok Park","orcid":"https://orcid.org/0000-0002-7331-9819"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Denolf, Kristof","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Park, Eunhyeok","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Eunhyeok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.1607999950647354,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.1607999950647354,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.14970000088214874,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.12540000677108765,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.7146000266075134},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.7063999772071838},{"id":"https://openalex.org/keywords/hadamard-transform","display_name":"Hadamard transform","score":0.5616000294685364},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.555899977684021},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4715000092983246},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.42340001463890076},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4156000018119812},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.41429999470710754}],"concepts":[{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.7146000266075134},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.7063999772071838},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5845999717712402},{"id":"https://openalex.org/C60292330","wikidata":"https://www.wikidata.org/wiki/Q1014065","display_name":"Hadamard transform","level":2,"score":0.5616000294685364},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.555899977684021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5511000156402588},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4715000092983246},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4677000045776367},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.42340001463890076},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4156000018119812},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.41429999470710754},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.35100001096725464},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33980000019073486},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.3391000032424927},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.33180001378059387},{"id":"https://openalex.org/C196216189","wikidata":"https://www.wikidata.org/wiki/Q2867","display_name":"Wavelet transform","level":3,"score":0.33149999380111694},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.3107999861240387},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.28290000557899475},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.25200000405311584}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.02525","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02525","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.02525","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.02525","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Hadamard":[0,31,91,99],"transforms":[1],"have":[2],"become":[3],"a":[4,49,81,124],"key":[5],"tool":[6],"for":[7],"stabilizing":[8],"low-precision":[9],"training,":[10,59],"but":[11],"existing":[12],"methods":[13],"apply":[14],"them":[15],"uniformly":[16],"across":[17],"tensors":[18],"and":[19,55,68,70,110],"computation":[20],"paths.":[21],"We":[22,87],"show":[23,71],"that":[24,72,116],"this":[25],"one-size-fits-all":[26],"strategy":[27],"is":[28,40],"inherently":[29],"limited:":[30],"smoothing":[32],"reduces":[33],"quantization":[34],"error":[35],"only":[36],"when":[37,102,127],"its":[38],"direction":[39],"properly":[41,105],"aligned":[42],"with":[43,93,144],"the":[44,107],"operand's":[45],"outlier":[46,64,74,119],"structure.":[47],"Through":[48],"systematic":[50],"study":[51],"of":[52],"weights,":[53],"activations,":[54],"gradients":[56],"in":[57,77],"LLM":[58],"we":[60],"identify":[61],"three":[62],"stable":[63],"patterns,":[65],"Row-wise,":[66],"Column-wise,":[67],"None,":[69],"each":[73],"pattern":[75],"pair":[76],"matrix":[78],"multiplication":[79],"requires":[80],"distinct":[82],"transform":[83,92],"or":[84,121],"outlier-handling":[85],"strategy.":[86],"propose":[88],"AdaHOP,":[89],"Adaptive":[90],"Outlier-Pattern-aware":[94],"strategy,":[95],"which":[96],"applies":[97,112],"Inner":[98],"Transform":[100],"(IHT)":[101],"inner-dimension":[103],"mixing":[104],"suppresses":[106],"operands'":[108],"outliers,":[109],"selectively":[111],"Outlier":[113],"Extraction":[114],"(OE)":[115],"extracts":[117],"dominant":[118],"rows":[120],"columns":[122],"into":[123],"high-precision":[125],"path":[126],"it":[128],"does":[129],"not.":[130],"With":[131],"fused,":[132],"hardware-aware":[133],"Triton":[134],"kernels,":[135],"AdaHOP":[136],"enables":[137],"training":[138,156],"from":[139],"scratch":[140],"at":[141],"MXFP4":[142],"precision":[143],"BF16-level":[145],"quality,":[146],"while":[147],"achieving":[148],"up":[149],"to":[150],"3.6X":[151],"memory":[152],"compression,":[153],"1.46X":[154],"end-to-end":[155],"speedup":[157],"over":[158],"BF16.":[159]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-07T00:00:00"}
