{"id":"https://openalex.org/W7133332671","doi":"https://doi.org/10.48550/arxiv.2603.00958","title":"S-VoCAL: A Dataset and Evaluation Framework for Inferring Speaking Voice Character Attributes in Literature","display_name":"S-VoCAL: A Dataset and Evaluation Framework for Inferring Speaking Voice Character Attributes in Literature","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133332671","doi":"https://doi.org/10.48550/arxiv.2603.00958"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.00958","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00958","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.00958","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5099842327","display_name":"Abigail Berthe-Pardo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Berthe-Pardo, Abigail","raw_affiliation_strings":["LORIA, Vand\u0153uvre-l\u00e8s-Nancy, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LORIA, Vand\u0153uvre-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210121838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113109459","display_name":"Gaspard Michel","orcid":null},"institutions":[{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Michel, Gaspard","raw_affiliation_strings":["LORIA, Vand\u0153uvre-l\u00e8s-Nancy, France","Deezer Research, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LORIA, Vand\u0153uvre-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210121838"]},{"raw_affiliation_string":"Deezer Research, Paris, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123349700","display_name":"Elena V. Epure","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Epure, Elena V.","raw_affiliation_strings":["Deezer Research, Paris, France","Idiap Research Institute, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Deezer Research, Paris, France","institution_ids":[]},{"raw_affiliation_string":"Idiap Research Institute, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015868219","display_name":"Christophe Cerisara","orcid":null},"institutions":[{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Cerisara, Christophe","raw_affiliation_strings":["LORIA, Vand\u0153uvre-l\u00e8s-Nancy, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LORIA, Vand\u0153uvre-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210121838"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5099842327"],"corresponding_institution_ids":["https://openalex.org/I4210121838"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.23770000040531158,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.23770000040531158,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11720000207424164,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.06949999928474426,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.8033000230789185},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.7699000239372253},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.695900022983551},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.6643999814987183},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6413999795913696},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.6014999747276306},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5766000151634216},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.516700029373169}],"concepts":[{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.8033000230789185},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.7699000239372253},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7383000254631042},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.695900022983551},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.6643999814987183},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6413999795913696},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.6014999747276306},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5766000151634216},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5264999866485596},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.516700029373169},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5121999979019165},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5095999836921692},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4018999934196472},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3343000113964081},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.33000001311302185},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28859999775886536},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2667999863624573},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.00958","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00958","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.00958","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00958","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.4579973518848419},{"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5","score":0.43106842041015625}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"recent":[1,149],"advances":[2],"in":[3,23,55,66,80,98,121],"Text-to-Speech":[4],"(TTS)":[5],"systems,":[6],"synthetic":[7,24],"audiobook":[8],"narration":[9,25],"has":[10],"seen":[11],"increased":[12],"interest,":[13],"reaching":[14],"unprecedented":[15],"levels":[16],"of":[17,48,64,111,138,158,171],"naturalness.":[18],"However,":[19],"larger":[20],"gaps":[21],"remain":[22],"systems'":[26,89],"ability":[27],"to":[28,41,51,86,107,168],"impersonate":[29],"fictional":[30,53,113],"characters,":[31],"and":[32,103,124,141,202],"convey":[33],"complex":[34,62],"emotions":[35],"or":[36,76,188,197],"prosody.":[37],"A":[38],"promising":[39],"direction":[40],"enhance":[42],"character":[43,114,173],"identification":[44],"is":[45],"the":[46,100,109,136,156,169,179],"assignment":[47],"plausible":[49],"voices":[50],"each":[52,139],"characters":[54],"a":[56,71,143,162],"book.":[57],"This":[58],"step":[59],"typically":[60],"requires":[61,82],"inference":[63,110],"attributes":[65,119,184],"book-length":[67],"contexts,":[68],"such":[69,185,194],"as":[70,186,195],"character's":[72],"age,":[73],"gender,":[74],"origin":[75],"physical":[77],"health,":[78],"which":[79],"turns":[81],"dedicated":[83,106],"benchmark":[84],"datasets":[85],"evaluate":[87,108],"extraction":[88],"performances.":[90],"We":[91,154],"present":[92],"S-VoCAL":[93,116,159],"(Speaking":[94],"Voice":[95],"Character":[96],"Attributes":[97],"Literature),":[99],"first":[101],"dataset":[102,201],"evaluation":[104,133,203],"framework":[105,134],"voice-related":[112],"attributes.":[115,174],"entails":[117],"8":[118],"grounded":[120],"sociophonetic":[122],"studies,":[123],"952":[125],"character-book":[126],"pairs":[127],"derived":[128],"from":[129],"Project":[130],"Gutenberg.":[131],"Its":[132],"addresses":[135],"particularities":[137],"attribute,":[140],"includes":[142],"novel":[144],"similarity":[145],"metric":[146],"based":[147],"on":[148,192],"Large":[150],"Language":[151],"Models":[152],"embeddings.":[153],"demonstrate":[155],"applicability":[157],"by":[160],"applying":[161],"simple":[163],"Retrieval-Augmented":[164],"Generation":[165],"(RAG)":[166],"pipeline":[167,181],"task":[170],"inferring":[172],"Our":[175],"results":[176],"suggest":[177],"that":[178],"RAG":[180],"reliably":[182],"infers":[183],"Age":[187],"Gender,":[189],"but":[190],"struggles":[191],"others":[193],"Origin":[196],"Physical":[198],"Health.":[199],"The":[200],"code":[204],"are":[205],"available":[206],"at":[207],"https://github.com/AbigailBerthe/S-VoCAL":[208],".":[209]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-04T00:00:00"}
