{"id":"https://openalex.org/W7161282589","doi":"https://doi.org/10.48550/arxiv.2605.14047","title":"Evolving Layer-Specific Scalar Functions for Hardware-Aware Transformer Adaptation","display_name":"Evolving Layer-Specific Scalar Functions for Hardware-Aware Transformer Adaptation","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7161282589","doi":"https://doi.org/10.48550/arxiv.2605.14047"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.14047","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14047","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.14047","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136253238","display_name":"Kieran Carrigg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carrigg, Kieran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099051616","display_name":"Sigur de Vries","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Vries, Sigur","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093461258","display_name":"Amirhossein Sadough","orcid":"https://orcid.org/0009-0005-5647-2888"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sadough, Amirhossein","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5074794877","display_name":"Marcel van Gerven","orcid":"https://orcid.org/0000-0002-2206-9098"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"van Gerven, Marcel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.3702000081539154,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.3702000081539154,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.15929999947547913,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.15440000593662262,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7232000231742859},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.5809000134468079},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.39959999918937683},{"id":"https://openalex.org/keywords/scalar","display_name":"Scalar (mathematics)","score":0.3880999982357025},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.37689998745918274},{"id":"https://openalex.org/keywords/homogeneous","display_name":"Homogeneous","score":0.37119999527931213}],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7232000231742859},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.5809000134468079},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5184999704360962},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4088999927043915},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.39959999918937683},{"id":"https://openalex.org/C57691317","wikidata":"https://www.wikidata.org/wiki/Q1289248","display_name":"Scalar (mathematics)","level":2,"score":0.3880999982357025},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.37689998745918274},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.37119999527931213},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3280999958515167},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.30649998784065247},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2994999885559082},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2992999851703644},{"id":"https://openalex.org/C110332635","wikidata":"https://www.wikidata.org/wiki/Q629498","display_name":"Genetic programming","level":2,"score":0.29589998722076416},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.2639000117778778},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2637999951839447},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.25940001010894775}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.14047","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14047","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.14047","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14047","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision":[0],"Transformers":[1],"(ViTs)":[2],"achieve":[3],"state-of-the-art":[4],"performance":[5,145],"on":[6,13,59,176],"challenging":[7],"vision":[8],"tasks,":[9],"but":[10],"their":[11],"deployment":[12,173],"edge":[14,177],"devices":[15],"is":[16],"severely":[17],"hindered":[18],"by":[19,28,37],"the":[20,98,111,118,148,171],"computational":[21],"complexity":[22,161],"and":[23,57,162],"global":[24,149],"reduction":[25,150],"bottleneck":[26],"imposed":[27],"layer":[29],"normalization.":[30],"Recent":[31],"methods":[32],"attempt":[33],"to":[34,53,78,100,122,132,170],"bypass":[35],"this":[36,64,144],"replacing":[38],"normalization":[39,113],"layers":[40],"with":[41,89],"hardware-friendly":[42],"scalar":[43,82],"approximations.":[44],"However,":[45],"these":[46],"homogeneous":[47,126],"replacements":[48],"do":[49],"not":[50],"optimally":[51],"fit":[52],"all":[54],"layers'":[55],"behaviour":[56],"rely":[58],"expensive":[60],"model":[61],"retraining.":[62],"In":[63],"work,":[65],"we":[66],"propose":[67],"a":[68,90,155,167],"highly":[69,156],"efficient,":[70],"hardware-aware":[71],"framework":[72],"that":[73],"utilizes":[74],"genetic":[75],"programming":[76],"(GP)":[77],"evolve":[79],"heterogeneous,":[80],"layer-specific":[81],"functions":[83],"directly":[84],"from":[85,103],"pre-trained":[86],"weights.":[87],"Coupled":[88],"novel":[91],"post-training":[92],"re-alignment":[93],"strategy,":[94],"our":[95,129,152],"approach":[96,153],"eliminates":[97],"need":[99],"retrain":[101],"models":[102],"scratch":[104],"entirely.":[105],"Our":[106],"evolved":[107],"expressions":[108],"accurately":[109],"approximate":[110],"target":[112],"behaviours,":[114],"capturing":[115],"$91.6\\%$":[116],"of":[117,174],"variance":[119],"($R^2$)":[120],"compared":[121],"only":[123,139],"$70.2\\%$":[124],"for":[125],"baselines,":[127],"allowing":[128],"modified":[130],"architecture":[131],"recover":[133],"$84.25\\%$":[134],"Top-1":[135],"ImageNet-1K":[136],"accuracy":[137],"in":[138],"20":[140],"epochs.":[141],"By":[142],"preserving":[143],"while":[146],"eliminating":[147],"bottleneck,":[151],"establishes":[154],"favourable":[157],"trade-off":[158],"between":[159],"arithmetic":[160],"off-chip":[163],"memory":[164],"traffic,":[165],"removing":[166],"primary":[168],"barrier":[169],"efficient":[172],"ViTs":[175],"accelerators.":[178]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-16T00:00:00"}
