{"id":"https://openalex.org/W7151422082","doi":"https://doi.org/10.48550/arxiv.2604.04704","title":"IDIOLEX: Unified and Continuous Representations for Idiolectal and Stylistic Variation","display_name":"IDIOLEX: Unified and Continuous Representations for Idiolectal and Stylistic Variation","publication_year":2026,"publication_date":"2026-04-06","ids":{"openalex":"https://openalex.org/W7151422082","doi":"https://doi.org/10.48550/arxiv.2604.04704"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.04704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.04704","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133129080","display_name":"Anjali Kantharuban","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kantharuban, Anjali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028765069","display_name":"Aarohi Srivastava","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Srivastava, Aarohi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133115748","display_name":"Fahim Faisal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Faisal, Fahim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045507345","display_name":"Orevaoghene Ahia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahia, Orevaoghene","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133097911","display_name":"Antonios Anastasopoulos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anastasopoulos, Antonios","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133086317","display_name":"David Chiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chiang, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133072143","display_name":"Yulia Tsvetkov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsvetkov, Yulia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133135359","display_name":"Graham Neubig","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Neubig, Graham","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5133129080"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.49059998989105225,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.49059998989105225,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.14030000567436218,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.10499999672174454,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.7383000254631042},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.6312000155448914},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6100000143051147},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5424000024795532},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4839000105857849},{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.4828000068664551}],"concepts":[{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.7383000254631042},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7174999713897705},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6959999799728394},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6312000155448914},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6100000143051147},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5867999792098999},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5424000024795532},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4839000105857849},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.4828000068664551},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.46230000257492065},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.2971000075340271},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.295199990272522},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2542000114917755},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.04704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.04704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.802725076675415,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Existing":[0],"sentence":[1,7,28],"representations":[2,29,94,113],"primarily":[3],"encode":[4],"what":[5],"a":[6,51,60,67,72,133],"says,":[8],"rather":[9],"than":[10],"how":[11],"it":[12],"is":[13,19],"expressed,":[14],"even":[15],"though":[16],"the":[17,42,83,109],"latter":[18],"important":[20],"for":[21,53,102,117,136],"many":[22],"applications.":[23],"In":[24],"contrast,":[25],"we":[26],"develop":[27],"that":[30,56,125],"capture":[31,95],"style":[32,78],"and":[33,79,90,98,104,129,139,152],"dialect,":[34],"decoupled":[35],"from":[36,59],"semantic":[37],"content.":[38],"We":[39,48,81,106],"call":[40],"this":[41],"task":[43],"of":[44,66,75,87,111],"idiolectal":[45],"representation":[46,74],"learning.":[47],"introduce":[49],"IDIOLEX,":[50],"framework":[52],"training":[54,115],"models":[55],"combines":[57],"supervision":[58],"sentence's":[61,68,77],"provenance":[62],"with":[63],"linguistic":[64],"features":[65],"content,":[69],"to":[70,145],"learn":[71],"continuous":[73],"each":[76],"dialect.":[80],"evaluate":[82],"approach":[84],"on":[85],"dialects":[86],"both":[88],"Arabic":[89],"Spanish.":[91],"The":[92],"learned":[93],"meaningful":[96],"variation":[97,131],"transfer":[99],"across":[100],"domains":[101],"analysis":[103],"classification.":[105],"further":[107],"explore":[108],"use":[110],"these":[112],"as":[114,149],"objectives":[116],"stylistically":[118],"aligning":[119],"language":[120],"models.":[121],"Our":[122],"results":[123],"suggest":[124],"jointly":[126],"modeling":[127],"individual":[128],"community-level":[130],"provides":[132],"useful":[134],"perspective":[135],"studying":[137],"idiolect":[138],"supports":[140],"downstream":[141],"applications":[142],"requiring":[143],"sensitivity":[144],"stylistic":[146],"differences,":[147],"such":[148],"developing":[150],"diverse":[151],"accessible":[153],"LLMs.":[154]},"counts_by_year":[],"updated_date":"2026-04-08T06:07:18.267832","created_date":"2026-04-08T00:00:00"}
