{"id":"https://openalex.org/W7131631842","doi":"https://doi.org/10.48550/arxiv.2602.21750","title":"From Words to Amino Acids: Does the Curse of Depth Persist?","display_name":"From Words to Amino Acids: Does the Curse of Depth Persist?","publication_year":2026,"publication_date":"2026-02-25","ids":{"openalex":"https://openalex.org/W7131631842","doi":"https://doi.org/10.48550/arxiv.2602.21750"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.21750","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126909931","display_name":"Aleena Siji","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Siji, Aleena","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018101784","display_name":"Amir Mohammad Karimi Mamaghan","orcid":"https://orcid.org/0000-0002-6820-948X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mamaghan, Amir Mohammad Karimi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058626028","display_name":"Ferdinand Kapl","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kapl, Ferdinand","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126944195","display_name":"Tobias H\u00f6ppe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"H\u00f6ppe, Tobias","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126906324","display_name":"Emmanouil Angelis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Angelis, Emmanouil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008956185","display_name":"Andrea Dittadi","orcid":"https://orcid.org/0000-0002-0670-9251"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dittadi, Andrea","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086420353","display_name":"Maurice Brenner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brenner, Maurice","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126907166","display_name":"Michael Heinzinger","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heinzinger, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045975901","display_name":"Karl Henrik Johansson","orcid":"https://orcid.org/0000-0001-9940-5929"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Johansson, Karl Henrik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042242259","display_name":"Kaitlin Maile","orcid":"https://orcid.org/0000-0001-5867-6976"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maile, Kaitlin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"von Oswald, Johannes","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"von Oswald, Johannes","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125368956","display_name":"Stefan Bauer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bauer, Stefan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5126909931"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.21070000529289246,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.21070000529289246,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.09790000319480896,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11642","display_name":"Genomics and Rare Diseases","score":0.06400000303983688,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.604200005531311},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5943999886512756},{"id":"https://openalex.org/keywords/curse","display_name":"Curse","score":0.590399980545044},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4975999891757965},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.48330000042915344},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.44279998540878296},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.4390999972820282}],"concepts":[{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.604200005531311},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5943999886512756},{"id":"https://openalex.org/C2780273121","wikidata":"https://www.wikidata.org/wiki/Q109411","display_name":"Curse","level":2,"score":0.590399980545044},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5127999782562256},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4975999891757965},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.48330000042915344},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4593000113964081},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.44279998540878296},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.44269999861717224},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.4390999972820282},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.3837999999523163},{"id":"https://openalex.org/C119898033","wikidata":"https://www.wikidata.org/wiki/Q3433888","display_name":"Ensemble forecasting","level":2,"score":0.37310001254081726},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3262999951839447},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3197000026702881},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.31869998574256897},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.29159998893737793},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.2847999930381775},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2547999918460846}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.21750","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.21750","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.21750","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.21750","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Protein":[0],"language":[1,23],"models":[2,24,91],"(PLMs)":[3],"have":[4],"become":[5],"widely":[6,89],"adopted":[7],"as":[8,30,105],"general-purpose":[9],"models,":[10,148],"demonstrating":[11],"strong":[12],"performance":[13],"in":[14,85,168,194],"protein":[15,101],"engineering":[16],"and":[17,43,95,103,126,129,144,191,219],"de":[18],"novo":[19],"design.":[20],"Like":[21],"large":[22,161],"(LLMs),":[25],"they":[26],"are":[27,44,92,97],"typically":[28],"trained":[29],"deep":[31],"transformers":[32],"with":[33,135],"next-token":[34],"or":[35],"masked-token":[36],"prediction":[37],"objectives":[38],"on":[39,52,158,215],"massive":[40],"sequence":[41,102],"corpora":[42],"scaled":[45],"by":[46],"increasing":[47],"model":[48,121],"depth.":[49],"Recent":[50],"work":[51,214],"autoregressive":[53],"LLMs":[54],"has":[55],"identified":[56],"the":[57,67,75,174,182],"Curse":[58],"of":[59,77,115,141,163,171,181,209],"Depth:":[60],"many":[61,88],"later":[62],"layers":[63,176],"contribute":[64],"little":[65],"to":[66],"final":[68,183],"output":[69],"predictions.":[70],"These":[71,185],"findings":[72,157],"naturally":[73],"raise":[74],"question":[76],"whether":[78],"a":[79,112,138,160,169,206],"similar":[80],"depth":[81,113,136,203],"inefficiency":[82,204],"also":[83,192],"appears":[84],"PLMs,":[86,211],"where":[87],"used":[90],"not":[93],"autoregressive,":[94,124],"some":[96],"multimodal,":[98],"accepting":[99],"both":[100],"structure":[104],"input.":[106],"In":[107],"this":[108],"work,":[109],"we":[110,149],"present":[111],"analysis":[114],"seven":[116],"popular":[117],"PLM":[118],"families":[119],"across":[120],"scales,":[122],"spanning":[123],"masked,":[125],"diffusion":[127],"objectives,":[128],"quantify":[130],"how":[131],"layer":[132],"contributions":[133],"evolve":[134],"using":[137],"unified":[139],"set":[140],"probing-,":[142],"perturbation-,":[143],"downstream-evaluation":[145],"measurements.":[146],"Across":[147],"observe":[150],"consistent":[151],"depth-dependent":[152],"patterns":[153],"that":[154,202],"extend":[155],"prior":[156],"LLMs:":[159],"fraction":[162],"task-relevant":[164],"computation":[165],"is":[166,205],"concentrated":[167],"subset":[170],"layers,":[172],"while":[173],"remaining":[175],"mainly":[177],"provide":[178],"incremental":[179],"refinement":[180],"prediction.":[184],"trends":[186],"persist":[187],"beyond":[188],"sequence-only":[189],"settings":[190],"appear":[193],"multimodal":[195],"PLMs.":[196],"Taken":[197],"together,":[198],"our":[199],"results":[200],"suggest":[201],"common":[207],"feature":[208],"modern":[210],"motivating":[212],"future":[213],"more":[216],"depth-efficient":[217],"architectures":[218],"training":[220],"methods.":[221]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-16T08:24:45.110214","created_date":"2026-02-27T00:00:00"}
