{"id":"https://openalex.org/W7139119199","doi":"https://doi.org/10.1609/aaai.v40i39.40568","title":"Positional Cognitive Specialization: Where Do LLMs Learn to Comprehend and Speak Your Language?","display_name":"Positional Cognitive Specialization: Where Do LLMs Learn to Comprehend and Speak Your Language?","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7139119199","doi":"https://doi.org/10.1609/aaai.v40i39.40568"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i39.40568","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40568","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40568/44529","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40568/44529","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130049142","display_name":"Luis Frentzen Salim","orcid":null},"institutions":[{"id":"https://openalex.org/I4210098366","display_name":"Institute of Information Science, Academia Sinica","ror":"https://ror.org/00z83z196","country_code":"TW","type":"facility","lineage":["https://openalex.org/I4210098366","https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Luis Frentzen Salim","raw_affiliation_strings":["Institute of Information Science, Academia Sinica\nDepartment of Computer Science and Information Engineering, National Taiwan University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science, Academia Sinica\nDepartment of Computer Science and Information Engineering, National Taiwan University of Science and Technology","institution_ids":["https://openalex.org/I4210098366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129785815","display_name":"Lun-Wei Ku","orcid":null},"institutions":[{"id":"https://openalex.org/I4210098366","display_name":"Institute of Information Science, Academia Sinica","ror":"https://ror.org/00z83z196","country_code":"TW","type":"facility","lineage":["https://openalex.org/I4210098366","https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Lun-Wei Ku","raw_affiliation_strings":["Institute of Information Science, Academia Sinica"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science, Academia Sinica","institution_ids":["https://openalex.org/I4210098366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030897009","display_name":"Hsing-Kuo Pao","orcid":"https://orcid.org/0000-0002-5518-9475"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Hsing-Kuo Kenneth Pao","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Taiwan University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Taiwan University of Science and Technology","institution_ids":["https://openalex.org/I154864474"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5130049142"],"corresponding_institution_ids":["https://openalex.org/I4210098366"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.98715203,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"39","first_page":"32875","last_page":"32883"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.29899999499320984,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.29899999499320984,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1964000016450882,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.07639999687671661,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.620199978351593},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.5303999781608582},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.48899999260902405},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.42640000581741333},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4075999855995178},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.4041999876499176},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.3476000130176544},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.34459999203681946},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.3278000056743622}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6345999836921692},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.620199978351593},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.5631999969482422},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.5303999781608582},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.48899999260902405},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4478999972343445},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.42640000581741333},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4075999855995178},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.4041999876499176},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.3873000144958496},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3476000130176544},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.34459999203681946},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3411000072956085},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.3278000056743622},{"id":"https://openalex.org/C2777723229","wikidata":"https://www.wikidata.org/wiki/Q4367921","display_name":"Learnability","level":2,"score":0.3176000118255615},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C150681269","wikidata":"https://www.wikidata.org/wiki/Q2380771","display_name":"Cognitive style","level":3,"score":0.30239999294281006},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.299699991941452},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2913999855518341},{"id":"https://openalex.org/C43091099","wikidata":"https://www.wikidata.org/wiki/Q1067788","display_name":"Through-the-lens metering","level":3,"score":0.2881999909877777},{"id":"https://openalex.org/C171041071","wikidata":"https://www.wikidata.org/wiki/Q36870","display_name":"First language","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C20854674","wikidata":"https://www.wikidata.org/wiki/Q4386060","display_name":"Cognitive architecture","level":3,"score":0.2858999967575073},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.27720001339912415},{"id":"https://openalex.org/C2780035574","wikidata":"https://www.wikidata.org/wiki/Q30081","display_name":"Multilingualism","level":2,"score":0.2768000066280365},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2667999863624573},{"id":"https://openalex.org/C21963081","wikidata":"https://www.wikidata.org/wiki/Q11337567","display_name":"Working memory","level":3,"score":0.2624000012874603},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.25519999861717224},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C94922259","wikidata":"https://www.wikidata.org/wiki/Q33215","display_name":"Constructed language","level":2,"score":0.25119999051094055},{"id":"https://openalex.org/C74672266","wikidata":"https://www.wikidata.org/wiki/Q815859","display_name":"Language acquisition","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i39.40568","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40568","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40568/44529","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i39.40568","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40568","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40568/44529","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7139119199.pdf","grobid_xml":"https://content.openalex.org/works/W7139119199.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Adapting":[0],"large":[1],"language":[2,16,73,99,216],"models":[3,17,41],"(LLMs)":[4],"to":[5,26,202],"new":[6,19,53,208],"languages":[7,20,54,209],"is":[8,24,177],"an":[9],"expensive":[10],"and":[11,21,77,90,110,135,210,214],"opaque":[12],"process.":[13],"Understanding":[14],"how":[15,39,88,205],"acquire":[18,52],"multilingual":[22,33,43],"abilities":[23],"key":[25],"achieve":[27],"efficient":[28],"adaptation.":[29],"Prior":[30],"work":[31],"on":[32,38,62,83,114],"interpretability":[34],"research":[35],"focuses":[36],"primarily":[37],"trained":[40],"process":[42],"instructions,":[44],"leaving":[45],"unexplored":[46],"the":[47,66,107,115,143,155,163],"mechanisms":[48],"through":[49,65],"which":[50,176],"they":[51],"during":[55],"training.":[56],"We":[57,138],"investigate":[58],"these":[59],"training":[60],"dynamics":[61],"decoder-only":[63],"transformers":[64],"lens":[67],"of":[68,97],"two":[69],"functional":[70],"cognitive":[71],"specializations:":[72],"perception":[74],"(input":[75],"comprehension)":[76],"production":[78],"(output":[79],"generation).":[80],"Through":[81],"experiments":[82],"low-resource":[84,181],"languages,":[85],"we":[86,119],"demonstrate":[87],"perceptual":[89],"productive":[91],"specialization":[92,117],"emerges":[93],"in":[94],"different":[95],"regions":[96],"a":[98,122,132],"model":[100],"by":[101,129],"running":[102],"layer":[103],"ablation":[104],"sweeps":[105],"from":[106,154],"model\u2019s":[108],"input":[109],"output":[111],"directions.":[112],"Based":[113],"observed":[116],"patterns,":[118],"propose":[120],"CogSym,":[121],"layer-wise":[123],"heuristic":[124],"that":[125,140],"enables":[126],"effective":[127],"adaptation":[128],"exclusively":[130],"finetuning":[131,157],"few":[133],"early":[134],"late":[136],"layers.":[137],"show":[139],"tuning":[141],"only":[142],"25%":[144],"outermost":[145],"layers":[146],"achieves":[147],"downstream":[148],"task":[149],"performance":[150,186],"within":[151],"2\u20133%":[152],"deviation":[153],"full":[156,196],"baseline.":[158],"Unlike":[159],"similar":[160],"layer-selection":[161],"methods,":[162],"proposed":[164],"method":[165],"requires":[166],"no":[167],"extra":[168],"data":[169],"or":[170],"computation":[171],"while":[172],"retaining":[173],"comparable":[174],"performance,":[175],"especially":[178],"beneficial":[179],"for":[180],"languages.":[182],"CogSym":[183],"yields":[184],"consistent":[185],"with":[187],"adapter":[188],"methods":[189],"such":[190],"as":[191],"LoRA,":[192],"showcasing":[193],"generalization":[194],"beyond":[195],"finetuning.":[197],"These":[198],"findings":[199],"provide":[200],"insights":[201],"better":[203],"understand":[204],"LLMs":[206],"learn":[207],"push":[211],"toward":[212],"accessible":[213],"inclusive":[215],"modeling.":[217]},"counts_by_year":[],"updated_date":"2026-03-20T20:54:20.808490","created_date":"2026-03-20T00:00:00"}
