{"id":"https://openalex.org/W7128491348","doi":"https://doi.org/10.48550/arxiv.2602.07547","title":"Linguistic properties and model scale in brain encoding: from small to compressed language models","display_name":"Linguistic properties and model scale in brain encoding: from small to compressed language models","publication_year":2026,"publication_date":"2026-02-07","ids":{"openalex":"https://openalex.org/W7128491348","doi":"https://doi.org/10.48550/arxiv.2602.07547"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.07547","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125483826","display_name":"Subba Reddy Oota","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Oota, Subba Reddy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084991192","display_name":"Vijay Rowtula","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rowtula, Vijay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125533937","display_name":"Satya Sai Srinath Namburi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Namburi, Satya Sai Srinath","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032698955","display_name":"Khushbu Pahwa","orcid":"https://orcid.org/0009-0009-6976-6120"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pahwa, Khushbu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002245577","display_name":"Anant Khandelwal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khandelwal, Anant","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125543021","display_name":"Manish Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Manish","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125570051","display_name":"Tanmoy Chakraborty","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chakraborty, Tanmoy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5000175925","display_name":"B.Naga raju","orcid":"https://orcid.org/0000-0002-8291-031X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Raju, Bapi S.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5125483826"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10465","display_name":"Neurobiology of Language and Bilingualism","score":0.607699990272522,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10465","display_name":"Neurobiology of Language and Bilingualism","score":0.607699990272522,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10094","display_name":"Epilepsy research and treatment","score":0.06750000268220901,"subfield":{"id":"https://openalex.org/subfields/2738","display_name":"Psychiatry and Mental health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.03590000048279762,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.7379000186920166},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.5450000166893005},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4390999972820282},{"id":"https://openalex.org/keywords/brain-activity-and-meditation","display_name":"Brain activity and meditation","score":0.4075999855995178},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.3903000056743622},{"id":"https://openalex.org/keywords/neurolinguistics","display_name":"Neurolinguistics","score":0.38449999690055847},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.37950000166893005},{"id":"https://openalex.org/keywords/dissociation","display_name":"Dissociation (chemistry)","score":0.3617999851703644}],"concepts":[{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.7379000186920166},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6983000040054321},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.5450000166893005},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5339999794960022},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49950000643730164},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4390999972820282},{"id":"https://openalex.org/C120843803","wikidata":"https://www.wikidata.org/wiki/Q4955807","display_name":"Brain activity and meditation","level":3,"score":0.4075999855995178},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.3903000056743622},{"id":"https://openalex.org/C155614148","wikidata":"https://www.wikidata.org/wiki/Q215948","display_name":"Neurolinguistics","level":4,"score":0.38449999690055847},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.37950000166893005},{"id":"https://openalex.org/C102931765","wikidata":"https://www.wikidata.org/wiki/Q189673","display_name":"Dissociation (chemistry)","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.3580999970436096},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3384000062942505},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.30239999294281006},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.28769999742507935},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.28189998865127563},{"id":"https://openalex.org/C64249296","wikidata":"https://www.wikidata.org/wiki/Q5250411","display_name":"Deep linguistic processing","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C2984127161","wikidata":"https://www.wikidata.org/wiki/Q969316","display_name":"Neural activity","level":2,"score":0.2791000008583069},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.27720001339912415},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.27079999446868896},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C58693492","wikidata":"https://www.wikidata.org/wiki/Q551875","display_name":"Neuroimaging","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.26190000772476196},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2542000114917755}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.07547","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.07547","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.07547","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.07547","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6769781112670898,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"work":[1],"has":[2],"shown":[3],"that":[4,113],"scaling":[5,195],"large":[6],"language":[7,87,102,131,202],"models":[8,33,88,125,199],"(LLMs)":[9],"improves":[10],"their":[11],"alignment":[12,134,179],"with":[13,148],"human":[14],"brain":[15,40,80,117,163,172,178],"activity,":[16],"yet":[17,171],"it":[18],"remains":[19,174],"unclear":[20],"what":[21,54],"drives":[22],"these":[23],"gains":[24],"and":[25,39,76,90,94,142,162,169,185,196],"which":[26],"representational":[27],"properties":[28],"are":[29,43],"responsible.":[30],"Although":[31],"larger":[32,121],"often":[34],"yield":[35],"better":[36],"task":[37,160],"performance":[38,161],"alignment,":[41],"they":[42],"increasingly":[44],"difficult":[45],"to":[46,61,108,138,188],"analyze":[47],"mechanistically.":[48],"This":[49],"raises":[50],"a":[51,151,157],"fundamental":[52],"question:":[53],"is":[55,135,186],"the":[56],"minimal":[57],"model":[58,74,105,183],"capacity":[59],"required":[60],"capture":[62],"brain-relevant":[63],"representations?":[64],"To":[65],"address":[66],"this":[67],"question,":[68],"we":[69,111],"systematically":[70],"investigate":[71],"how":[72],"constraining":[73],"scale":[75],"numerical":[77],"precision":[78],"affects":[79],"alignment.":[81],"We":[82],"compare":[83],"full-precision":[84],"LLMs,":[85,122],"small":[86],"(SLMs),":[89],"compressed":[91],"variants":[92],"(quantized":[93],"pruned)":[95],"by":[96],"predicting":[97],"fMRI":[98],"responses":[99],"during":[100],"naturalistic":[101],"comprehension.":[103],"Across":[104],"families":[106],"up":[107],"14B":[109],"parameters,":[110],"find":[112],"3B":[114],"SLMs":[115],"achieve":[116],"predictivity":[118,173],"indistinguishable":[119],"from":[120],"whereas":[123],"1B":[124],"degrade":[126],"substantially,":[127],"particularly":[128],"in":[129],"semantic":[130],"regions.":[132],"Brain":[133],"remarkably":[136],"robust":[137],"compression:":[139],"most":[140],"quantization":[141],"pruning":[143],"methods":[144],"preserve":[145],"neural":[146,194],"predictivity,":[147],"GPTQ":[149],"as":[150],"consistent":[152],"exception.":[153],"Linguistic":[154],"probing":[155],"reveals":[156],"dissociation":[158],"between":[159],"predictivity:":[164],"compression":[165],"degrades":[166],"discourse,":[167],"syntax,":[168],"morphology,":[170],"largely":[175],"unchanged.":[176],"Overall,":[177],"saturates":[180],"at":[181],"modest":[182],"scales":[184],"resilient":[187],"compression,":[189],"challenging":[190],"common":[191],"assumptions":[192],"about":[193],"motivating":[197],"compact":[198],"for":[200],"brain-aligned":[201],"modeling.":[203]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-11T00:00:00"}
