{"id":"https://openalex.org/W7160506192","doi":"https://doi.org/10.48550/arxiv.2605.05197","title":"Implicit Representations of Grammaticality in Language Models","display_name":"Implicit Representations of Grammaticality in Language Models","publication_year":2026,"publication_date":"2026-05-06","ids":{"openalex":"https://openalex.org/W7160506192","doi":"https://doi.org/10.48550/arxiv.2605.05197"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.05197","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05197","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.05197","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135591493","display_name":"Yingshan Susan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yingshan Susan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003617960","display_name":"Linlu Qiu","orcid":"https://orcid.org/0000-0002-1696-5419"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiu, Linlu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135629021","display_name":"Zhaofeng Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Zhaofeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5131112038","display_name":"Roger P. LEVY","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levy, Roger P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135571562","display_name":"Yoon Jin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Yoon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.4489000141620636,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.4489000141620636,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1858000010251999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.0771000012755394,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grammaticality","display_name":"Grammaticality","score":0.9983000159263611},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.7949000000953674},{"id":"https://openalex.org/keywords/grammar","display_name":"Grammar","score":0.4587000012397766},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3677000105381012},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.36059999465942383}],"concepts":[{"id":"https://openalex.org/C2779525943","wikidata":"https://www.wikidata.org/wiki/Q1187300","display_name":"Grammaticality","level":3,"score":0.9983000159263611},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.7949000000953674},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5440000295639038},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5212000012397766},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5134000182151794},{"id":"https://openalex.org/C26022165","wikidata":"https://www.wikidata.org/wiki/Q8091","display_name":"Grammar","level":2,"score":0.4587000012397766},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4124000072479248},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3677000105381012},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.36059999465942383},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.3285999894142151},{"id":"https://openalex.org/C2776818064","wikidata":"https://www.wikidata.org/wiki/Q829903","display_name":"Agreement","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2847999930381775},{"id":"https://openalex.org/C123556308","wikidata":"https://www.wikidata.org/wiki/Q484761","display_name":"Philosophy of language","level":3,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.05197","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05197","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.05197","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05197","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7276760935783386}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Grammaticality":[0],"and":[1,28,33,51,87,113,135],"likelihood":[2],"are":[3,14,133],"distinct":[4,63],"notions":[5],"in":[6,36,125,137,162],"human":[7],"language.":[8],"Pretrained":[9],"language":[10,18],"models":[11,16],"(LMs),":[12],"which":[13,126],"probabilistic":[15],"of":[17,75,85,129],"fitted":[19],"to":[20,95,108,121,182],"maximize":[21],"corpus":[22],"likelihood,":[23],"generate":[24],"grammatically":[25],"well-formed":[26],"text":[27,98],"discriminate":[29,48],"well":[30],"between":[31,49],"grammatical":[32,50,86,134],"ungrammatical":[34,52,89],"sentences":[35,53,90],"tightly":[37],"controlled":[38],"minimal":[39,131],"pairs.":[40],"However,":[41],"their":[42,190],"string":[43,65,146,157,173],"probabilities":[44,158],"do":[45,56],"not":[46],"sharply":[47],"overall.":[54],"But":[55],"LMs":[57,180],"implicitly":[58],"acquire":[59,181],"a":[60,79,83,96,130],"grammaticality":[61,105,110,117,160,187],"distinction":[62,188],"from":[64],"probability?":[66],"We":[67,100],"explore":[68],"this":[69,103],"question":[70],"through":[71],"studying":[72],"internal":[73],"representations":[74],"LMs,":[76],"by":[77,92],"training":[78],"linear":[80],"probe":[81,106,141,150,167],"on":[82,159],"dataset":[84],"(synthetic)":[88],"obtained":[91],"applying":[93],"perturbations":[94],"naturalistic":[97],"corpus.":[99],"find":[101],"that":[102,179],"simple":[104],"generalizes":[107],"human-curated":[109],"judgment":[111],"benchmarks":[112,161],"outperforms":[114],"LM":[115],"probability-based":[116],"judgments.":[118],"When":[119],"applied":[120],"semantic":[122],"plausibility":[123],"benchmarks,":[124],"both":[127],"members":[128],"pair":[132],"differ":[136],"only":[138,170],"plausibility,":[139],"the":[140],"however":[142],"performs":[143],"worse":[144],"than":[145],"probability.":[147],"The":[148],"English-trained":[149],"also":[151],"exhibits":[152],"nontrivial":[153],"cross-lingual":[154],"generalization,":[155],"outperforming":[156],"numerous":[163],"other":[164],"languages.":[165],"Additionally,":[166],"scores":[168],"correlate":[169],"weakly":[171],"with":[172],"probabilities.":[174],"These":[175],"results":[176],"collectively":[177],"suggest":[178],"some":[183],"extent":[184],"an":[185],"implicit":[186],"within":[189],"hidden":[191],"layers.":[192]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-08T00:00:00"}
