{"id":"https://openalex.org/W7140123509","doi":"https://doi.org/10.48550/arxiv.2603.19940","title":"Hybrid topic modelling for computational close reading: Mapping narrative themes in Pushkin's Evgenij Onegin","display_name":"Hybrid topic modelling for computational close reading: Mapping narrative themes in Pushkin's Evgenij Onegin","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W7140123509","doi":"https://doi.org/10.48550/arxiv.2603.19940"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.19940","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19940","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.19940","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130370727","display_name":"Angelo Maria Sabatini","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sabatini, Angelo Maria","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5130370727"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.3109000027179718,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.3109000027179718,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11869999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.08590000122785568,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.8083000183105469},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.7760000228881836},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.6746000051498413},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.6134999990463257},{"id":"https://openalex.org/keywords/thematic-map","display_name":"Thematic map","score":0.5223000049591064},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.47769999504089355},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.41659998893737793},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4108999967575073}],"concepts":[{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.8083000183105469},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.7760000228881836},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7222999930381775},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.6746000051498413},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6377000212669373},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6269000172615051},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.6134999990463257},{"id":"https://openalex.org/C93692415","wikidata":"https://www.wikidata.org/wiki/Q1502030","display_name":"Thematic map","level":2,"score":0.5223000049591064},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.47769999504089355},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.41659998893737793},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4108999967575073},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C2778109090","wikidata":"https://www.wikidata.org/wiki/Q7781195","display_name":"Thematic structure","level":2,"score":0.38679999113082886},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.3799000084400177},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.36079999804496765},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.334199994802475},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.3231000006198883},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.32170000672340393},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3203999996185303},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.3197000026702881},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30469998717308044},{"id":"https://openalex.org/C78015137","wikidata":"https://www.wikidata.org/wiki/Q847829","display_name":"Narrative structure","level":3,"score":0.29829999804496765},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.2768000066280365},{"id":"https://openalex.org/C69738355","wikidata":"https://www.wikidata.org/wiki/Q1228929","display_name":"Linear discriminant analysis","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C22354355","wikidata":"https://www.wikidata.org/wiki/Q422009","display_name":"Partial least squares regression","level":2,"score":0.26829999685287476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.19940","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19940","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.19940","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19940","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.5822178721427917}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"study":[1],"presents":[2],"a":[3,37,61,88,97,147,184,191],"hybrid":[4],"topic":[5],"modelling":[6],"framework":[7,145],"for":[8],"computational":[9,148],"literary":[10,141,199],"analysis":[11],"that":[12,106],"integrates":[13],"Latent":[14],"Dirichlet":[15],"Allocation":[16],"(LDA)":[17],"with":[18,130],"sparse":[19],"Partial":[20],"Least":[21],"Squares":[22],"Discriminant":[23],"Analysis":[24],"(sPLS-DA)":[25],"to":[26,121,196],"model":[27],"thematic":[28,127,161],"structure":[29],"and":[30,55,80,134],"longitudinal":[31],"dynamics":[32],"in":[33,47,60,201],"narrative":[34,123],"poetry.":[35],"As":[36],"case":[38],"study,":[39],"we":[40],"analyse":[41],"Evgenij":[42],"Onegin-Aleksandr":[43],"S.":[44],"Pushkin's":[45],"novel":[46],"verse-using":[48],"an":[49],"Italian":[50],"translation,":[51,187],"testing":[52],"whether":[53],"unsupervised":[54],"supervised":[56,98],"lexical":[57,104],"structures":[58],"converge":[59],"small-corpus":[62,86],"setting.":[63],"The":[64],"poetic":[65,165],"text":[66],"is":[67,92],"segmented":[68],"into":[69],"thirty-five":[70],"documents":[71],"of":[72,112,150,163],"lemmatised":[73,186],"content":[74],"words,":[75],"from":[76],"which":[77],"five":[78],"stable":[79],"interpretable":[81],"topics":[82],"emerge.":[83],"To":[84],"address":[85],"instability,":[87],"multi-seed":[89],"consensus":[90],"protocol":[91],"adopted.":[93],"Using":[94],"sPLS-DA":[95],"as":[96,172],"probe":[99],"enhances":[100],"interpretability":[101],"by":[102],"identifying":[103],"markers":[105],"refine":[107],"each":[108],"theme.":[109],"Narrative":[110],"hubs-groups":[111],"contiguous":[113],"stanzas":[114],"marking":[115],"key":[116],"episodes-extend":[117],"the":[118,122,131,143,188],"bag-of-words":[119],"approach":[120,189],"level,":[124],"revealing":[125],"how":[126,154],"mixtures":[128],"align":[129],"poem's":[132],"emotional":[133],"structural":[135],"arc.":[136],"Rather":[137],"than":[138],"replacing":[139],"traditional":[140],"interpretation,":[142],"proposed":[144],"offers":[146],"form":[149],"close":[151],"reading,":[152],"illustrating":[153],"lightweight":[155],"probabilistic":[156],"models":[157],"can":[158],"yield":[159],"reproducible":[160],"maps":[162],"complex":[164],"narratives,":[166],"even":[167],"when":[168],"stylistic":[169],"features":[170],"such":[171],"metre,":[173],"phonology,":[174],"or":[175],"native":[176],"morphology":[177],"are":[178],"abstracted":[179],"away.":[180],"Despite":[181],"relying":[182],"on":[183],"single":[185],"provides":[190],"transparent":[192],"methodological":[193],"template":[194],"applicable":[195],"other":[197],"high-density":[198],"texts":[200],"comparative":[202],"studies.":[203]},"counts_by_year":[],"updated_date":"2026-03-24T06:04:31.470712","created_date":"2026-03-24T00:00:00"}
