{"id":"https://openalex.org/W7140164398","doi":"https://doi.org/10.48550/arxiv.2603.20695","title":"Can I guess where you are from? Modeling dialectal morphosyntactic similarities in Brazilian Portuguese","display_name":"Can I guess where you are from? Modeling dialectal morphosyntactic similarities in Brazilian Portuguese","publication_year":2026,"publication_date":"2026-03-21","ids":{"openalex":"https://openalex.org/W7140164398","doi":"https://doi.org/10.48550/arxiv.2603.20695"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.20695","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20695","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.20695","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Siqueira, Manoel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Siqueira, Manoel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Freitag, Raquel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Freitag, Raquel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11640","display_name":"Linguistic Variation and Morphology","score":0.6797000169754028,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11640","display_name":"Linguistic Variation and Morphology","score":0.6797000169754028,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.09960000216960907,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10034","display_name":"Syntax, Semantics, Linguistic Variation","score":0.04340000078082085,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/brazilian-portuguese","display_name":"Brazilian Portuguese","score":0.7197999954223633},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6176999807357788},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5920000076293945},{"id":"https://openalex.org/keywords/portuguese","display_name":"Portuguese","score":0.49239999055862427},{"id":"https://openalex.org/keywords/computational-linguistics","display_name":"Computational linguistics","score":0.4487000107765198},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.41280001401901245},{"id":"https://openalex.org/keywords/sociolinguistics","display_name":"Sociolinguistics","score":0.4104999899864197}],"concepts":[{"id":"https://openalex.org/C2778880076","wikidata":"https://www.wikidata.org/wiki/Q750553","display_name":"Brazilian Portuguese","level":3,"score":0.7197999954223633},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.6732000112533569},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6176999807357788},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5920000076293945},{"id":"https://openalex.org/C35219183","wikidata":"https://www.wikidata.org/wiki/Q5146","display_name":"Portuguese","level":2,"score":0.49239999055862427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44920000433921814},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.4487000107765198},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4377000033855438},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4129999876022339},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.41280001401901245},{"id":"https://openalex.org/C28519872","wikidata":"https://www.wikidata.org/wiki/Q160845","display_name":"Sociolinguistics","level":2,"score":0.4104999899864197},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4058000147342682},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.39660000801086426},{"id":"https://openalex.org/C2781202465","wikidata":"https://www.wikidata.org/wiki/Q18346297","display_name":"Lexical diversity","level":3,"score":0.384799987077713},{"id":"https://openalex.org/C2992249680","wikidata":"https://www.wikidata.org/wiki/Q315","display_name":"Linguistic diversity","level":2,"score":0.37139999866485596},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.35190001130104065},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.3018999993801117},{"id":"https://openalex.org/C2780939345","wikidata":"https://www.wikidata.org/wiki/Q922399","display_name":"European Portuguese","level":3,"score":0.27070000767707825},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C524601802","wikidata":"https://www.wikidata.org/wiki/Q2198157","display_name":"Quantitative linguistics","level":3,"score":0.25519999861717224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.20695","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20695","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.20695","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20695","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4910387098789215,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"investigates":[2],"morphosyntactic":[3],"covariation":[4,40],"in":[5,71],"Brazilian":[6],"Portuguese":[7],"(BP)":[8],"to":[9,30,38],"assess":[10],"whether":[11],"dialectal":[12,42,62,96],"origin":[13],"can":[14],"be":[15],"inferred":[16],"from":[17],"the":[18,65,80,83,99],"combined":[19],"behavior":[20],"of":[21,85,101],"linguistic":[22],"variables.":[23],"Focusing":[24],"on":[25],"four":[26],"grammatical":[27],"phenomena":[28],"related":[29],"pronouns,":[31],"correlation":[32,48],"and":[33,41,77,90],"clustering":[34,55],"methods":[35],"are":[36],"applied":[37],"model":[39],"distribution.":[43],"The":[44],"results":[45],"indicate":[46],"that":[47,59,94],"captures":[49],"only":[50],"limited":[51],"pairwise":[52],"associations,":[53],"whereas":[54],"reveals":[56],"speaker":[57],"groupings":[58],"reflect":[60],"regional":[61],"patterns.":[63],"Despite":[64],"methodological":[66],"constraints":[67],"imposed":[68],"by":[69],"differences":[70],"sample":[72],"size":[73],"requirements":[74],"between":[75],"sociolinguistics":[76],"computational":[78],"approaches,":[79],"study":[81],"highlights":[82],"importance":[84],"interdisciplinary":[86],"research.":[87],"Developing":[88],"fair":[89],"inclusive":[91],"language":[92],"technologies":[93],"respect":[95],"diversity":[97],"outweighs":[98],"challenges":[100],"integrating":[102],"these":[103],"fields.":[104]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-25T00:00:00"}
