{"id":"https://openalex.org/W7161579476","doi":"https://doi.org/10.48550/arxiv.2605.15649","title":"Towards Code-Oriented LM Embeddings for Surrogate-Assisted Neural Architecture Search","display_name":"Towards Code-Oriented LM Embeddings for Surrogate-Assisted Neural Architecture Search","publication_year":2026,"publication_date":"2026-05-15","ids":{"openalex":"https://openalex.org/W7161579476","doi":"https://doi.org/10.48550/arxiv.2605.15649"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.15649","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15649","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.15649","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136425546","display_name":"Pranav Somu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Somu, Pranav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086056935","display_name":"Advay Balakrishnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balakrishnan, Advay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136422674","display_name":"Stepan Kravtsov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kravtsov, Stepan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136413610","display_name":"Aaron McDaniel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McDaniel, Aaron","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5079412677","display_name":"Jason Zutty","orcid":"https://orcid.org/0000-0001-7977-1454"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zutty, Jason","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.20550000667572021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.20550000667572021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.13410000503063202,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.09430000185966492,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7271000146865845},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.6040999889373779},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.570900022983551},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5669000148773193},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5080000162124634},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4814000129699707},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.44519999623298645},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.36820000410079956},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3659000098705292}],"concepts":[{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7271000146865845},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7195000052452087},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.6040999889373779},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.597599983215332},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.570900022983551},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5669000148773193},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5080000162124634},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4814000129699707},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.44519999623298645},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4050000011920929},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.38960000872612},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.36820000410079956},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3659000098705292},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.3644999861717224},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3278000056743622},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.32749998569488525},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.32519999146461487},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.31209999322891235},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3091999888420105},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.28839999437332153},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.28209999203681946},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.27869999408721924},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.27079999446868896},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.2628999948501587},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.15649","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15649","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.15649","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15649","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5722661018371582,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Developing":[0],"effective":[1],"surrogates":[2],"(performance":[3],"predictors)":[4],"for":[5,133,142,146,189],"Neural":[6],"Architecture":[7],"Search":[8],"(NAS)":[9],"typically":[10],"requires":[11],"expensive":[12],"fine-tuning":[13],"or":[14],"the":[15,28,67,91,126,151,160,164],"engineering":[16],"of":[17,31,159],"complex":[18],"representations.":[19],"We":[20,78,117],"propose":[21],"a":[22,74,147,184],"low-cost":[23],"embedding":[24,84],"strategy":[25],"that":[26,49,98],"leverages":[27],"inductive":[29],"bias":[30],"Language":[32],"Models":[33],"(LMs)":[34],"to":[35,82,155],"eliminate":[36],"these":[37,179],"overheads.":[38],"By":[39],"representing":[40],"architectures":[41],"as":[42,53,177,183],"PyTorch":[43],"class":[44],"definition":[45],"text,":[46],"we":[47],"demonstrate":[48],"off-the-shelf":[50],"LMs":[51],"act":[52],"competitive":[54],"feature":[55],"extractors":[56],"without":[57],"NAS-specialized":[58],"fine-tuning.":[59],"The":[60],"final":[61],"predictor":[62],"is":[63],"constructed":[64],"by":[65],"passing":[66],"extracted":[68],"Code-Oriented":[69],"LM":[70],"Embeddings":[71],"(COLE)":[72],"through":[73],"lightweight":[75],"regression":[76],"head.":[77],"also":[79,118],"investigate":[80],"strategies":[81],"improve":[83],"quality":[85],"and":[86,93,186],"utilization.":[87],"Our":[88],"experiments":[89],"on":[90],"NAS-Bench-201":[92],"einspace":[94],"search":[95,124,165],"spaces":[96],"reveal":[97],"raw":[99],"code":[100],"inputs":[101],"yield":[102],"higher":[103],"predictive":[104],"performance":[105],"than":[106],"other":[107],"text-based":[108],"encodings":[109,139],"(e.g.,":[110],"ONNX-to-text":[111],"encodings)":[112],"when":[113],"using":[114,125],"frozen":[115],"LMs.":[116],"observe":[119],"COLE":[120,141,182],"drives":[121],"superior":[122],"surrogate-assisted":[123],"BANANAS":[127],"algorithm":[128],"in":[129,150,163],"NAS-Bench-201.":[130],"When":[131],"optimizing":[132],"CIFAR-100":[134],"performance,":[135],"replacing":[136],"structural":[137],"path":[138],"with":[140],"architecture":[143,162,173],"representation":[144],"allows":[145],"34%":[148],"decrease":[149],"evaluation":[152],"budget":[153],"required":[154],"reach":[156],"within":[157],"1%":[158],"fittest":[161],"space":[166],"(by":[167],"test":[168],"accuracy).":[169],"As":[170],"any":[171],"neural":[172],"can":[174],"be":[175],"represented":[176],"code,":[178],"findings":[180],"establish":[181],"versatile":[185],"efficient":[187],"foundation":[188],"advancing":[190],"NAS.":[191]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-19T00:00:00"}
