{"id":"https://openalex.org/W7130338329","doi":"https://doi.org/10.1007/s13278-026-01584-6","title":"Taggus: an automated pipeline for the extraction of characters\u2019 social networks from portuguese fiction literature","display_name":"Taggus: an automated pipeline for the extraction of characters\u2019 social networks from portuguese fiction literature","publication_year":2026,"publication_date":"2026-02-18","ids":{"openalex":"https://openalex.org/W7130338329","doi":"https://doi.org/10.1007/s13278-026-01584-6"},"language":"en","primary_location":{"id":"doi:10.1007/s13278-026-01584-6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s13278-026-01584-6","pdf_url":null,"source":{"id":"https://openalex.org/S2764891196","display_name":"Social Network Analysis and Mining","issn_l":"1869-5450","issn":["1869-5450","1869-5469"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Social Network Analysis and Mining","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1007/s13278-026-01584-6","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025629843","display_name":"Tiago Can\u00e1rio","orcid":null},"institutions":[{"id":"https://openalex.org/I83558840","display_name":"Universidade Nova de Lisboa","ror":"https://ror.org/02xankh89","country_code":"PT","type":"education","lineage":["https://openalex.org/I83558840"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Tiago G. Can\u00e1rio","raw_affiliation_strings":["NOVA Information Management School (NOVA IMS), Universidade Nova de Lisboa, Campus de Campolide, 1070-312, Lisboa, Portugal"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NOVA Information Management School (NOVA IMS), Universidade Nova de Lisboa, Campus de Campolide, 1070-312, Lisboa, Portugal","institution_ids":["https://openalex.org/I83558840"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042632378","display_name":"Catarina M.M. Duarte","orcid":"https://orcid.org/0000-0002-4633-5979"},"institutions":[{"id":"https://openalex.org/I83558840","display_name":"Universidade Nova de Lisboa","ror":"https://ror.org/02xankh89","country_code":"PT","type":"education","lineage":["https://openalex.org/I83558840"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Catarina Duarte","raw_affiliation_strings":["NOVA Information Management School (NOVA IMS), Universidade Nova de Lisboa, Campus de Campolide, 1070-312, Lisboa, Portugal"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NOVA Information Management School (NOVA IMS), Universidade Nova de Lisboa, Campus de Campolide, 1070-312, Lisboa, Portugal","institution_ids":["https://openalex.org/I83558840"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056296020","display_name":"Fl\u00e1vio L. Pinheiro","orcid":"https://orcid.org/0000-0002-0561-9641"},"institutions":[{"id":"https://openalex.org/I83558840","display_name":"Universidade Nova de Lisboa","ror":"https://ror.org/02xankh89","country_code":"PT","type":"education","lineage":["https://openalex.org/I83558840"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Fl\u00e1vio L. Pinheiro","raw_affiliation_strings":["NOVA Information Management School (NOVA IMS), Universidade Nova de Lisboa, Campus de Campolide, 1070-312, Lisboa, Portugal"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NOVA Information Management School (NOVA IMS), Universidade Nova de Lisboa, Campus de Campolide, 1070-312, Lisboa, Portugal","institution_ids":["https://openalex.org/I83558840"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102007589","display_name":"Jo\u00e3o L. M. Pereira","orcid":"https://orcid.org/0000-0002-3247-5524"},"institutions":[{"id":"https://openalex.org/I21803372","display_name":"University of \u00c9vora","ror":"https://ror.org/02gyps716","country_code":"PT","type":"education","lineage":["https://openalex.org/I21803372"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Jo\u00e3o L. M. Pereira","raw_affiliation_strings":["Centro Algoritmi/LASI, University of \u00c9vora, 7000-671, \u00c9vora, Portugal"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centro Algoritmi/LASI, University of \u00c9vora, 7000-671, \u00c9vora, Portugal","institution_ids":["https://openalex.org/I21803372"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5025629843"],"corresponding_institution_ids":["https://openalex.org/I83558840"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.32314018,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"16","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4381999969482422,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4381999969482422,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.06390000134706497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.05909999832510948,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7121000289916992},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6762999892234802},{"id":"https://openalex.org/keywords/portuguese","display_name":"Portuguese","score":0.6036999821662903},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5891000032424927},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.527999997138977},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.5224000215530396},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.490200012922287},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.4713999927043915}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8015000224113464},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7121000289916992},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6762999892234802},{"id":"https://openalex.org/C35219183","wikidata":"https://www.wikidata.org/wiki/Q5146","display_name":"Portuguese","level":2,"score":0.6036999821662903},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5891000032424927},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5652999877929688},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.527999997138977},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.5224000215530396},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5180000066757202},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.490200012922287},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.4713999927043915},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.4546999931335449},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.436599999666214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3840000033378601},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.35580000281333923},{"id":"https://openalex.org/C153604712","wikidata":"https://www.wikidata.org/wiki/Q7310755","display_name":"Relationship extraction","level":3,"score":0.3433000147342682},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3352000117301941},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.33390000462532043},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.3273000121116638},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30889999866485596},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.29409998655319214},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.27639999985694885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s13278-026-01584-6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s13278-026-01584-6","pdf_url":null,"source":{"id":"https://openalex.org/S2764891196","display_name":"Social Network Analysis and Mining","issn_l":"1869-5450","issn":["1869-5450","1869-5469"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Social Network Analysis and Mining","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s13278-026-01584-6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s13278-026-01584-6","pdf_url":null,"source":{"id":"https://openalex.org/S2764891196","display_name":"Social Network Analysis and Mining","issn_l":"1869-5450","issn":["1869-5450","1869-5469"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Social Network Analysis and Mining","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.8183728456497192,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1519756925","https://openalex.org/W1986825611","https://openalex.org/W2009434538","https://openalex.org/W2010771292","https://openalex.org/W2021224503","https://openalex.org/W2061863227","https://openalex.org/W2062019458","https://openalex.org/W2093044076","https://openalex.org/W2182410279","https://openalex.org/W2187389059","https://openalex.org/W2193641145","https://openalex.org/W2234547888","https://openalex.org/W2250709464","https://openalex.org/W2250761302","https://openalex.org/W2251483280","https://openalex.org/W2337121348","https://openalex.org/W2544696940","https://openalex.org/W2548543055","https://openalex.org/W2599805910","https://openalex.org/W2766623381","https://openalex.org/W2913389685","https://openalex.org/W2938716404","https://openalex.org/W2946356689","https://openalex.org/W2952411148","https://openalex.org/W2953647140","https://openalex.org/W3037850407","https://openalex.org/W3096366085","https://openalex.org/W3104415840","https://openalex.org/W3177049011","https://openalex.org/W3195349883","https://openalex.org/W4290879105","https://openalex.org/W4295847212","https://openalex.org/W4382866372","https://openalex.org/W4383679902","https://openalex.org/W4383737590","https://openalex.org/W4387021627","https://openalex.org/W4403157697","https://openalex.org/W4404781463"],"related_works":[],"abstract_inverted_index":{"The":[0,202],"Automatic":[1],"identification":[2],"of":[3,47,65,121,130,135,151,185],"characters":[4,137],"and":[5,33,107,118,138,142,153,183,191],"their":[6],"interactions":[7,197],"from":[8,84],"literary":[9,85],"fiction":[10,86],"is,":[11],"arguably,":[12],"a":[13,63,74,92,119],"complex":[14],"task":[15,134],"that":[16,19,98],"requires":[17],"pipelines":[18],"leverage":[20],"multiple":[21],"Natural":[22],"Language":[23,109],"Processing":[24],"(NLP)":[25],"methods,":[26],"such":[27],"as":[28,198],"Named":[29],"Entity":[30],"Recognition":[31],"(NER)":[32],"Part-of-speech":[34],"(POS)":[35],"tagging.":[36],"However,":[37],"these":[38],"methods":[39,53,173],"are":[40,170,189],"not":[41],"optimized":[42],"for":[43,69,140,174,214],"retrieving":[44],"Social":[45],"Networks":[46],"Characters.":[48],"Indeed,":[49],"the":[50,133,156,160,181,193,199,215],"currently":[51],"available":[52,102,162,207],"tend":[54],"to":[55,62,80,100,167,208],"underperform,":[56],"especially":[57],"in":[58,88,132,144,192,211],"less-represented":[59],"languages,":[60],"due":[61],"lack":[64],"manually":[66],"annotated":[67],"data":[68],"training.":[70],"Here,":[71],"we":[72,77],"propose":[73],"pipeline,":[75,113],"which":[76,114],"call":[78],"Taggus,":[79],"extract":[81],"social":[82],"networks":[83],"works":[87],"Portuguese":[89,216],"without":[90],"requiring":[91],"training":[93],"phase.":[94],"Our":[95],"results":[96,125,157,169],"show":[97],"compared":[99],"readily":[101,161],"State-of-the-Art":[103,163],"tools\u2014off-the-shelf":[104],"NER":[105],"tools":[106],"Large":[108],"Models":[110],"(ChatGPT)\u2014the":[111],"resulting":[112],"uses":[115],"POS":[116],"tagging":[117],"combination":[120],"heuristics,":[122],"achieves":[123],"satisfying":[124],"with":[126],"an":[127],"average":[128],"F1-Score":[129],"$$92.1\\%$$":[131],"identifying":[136],"solving":[139],"co-reference":[141],"$$74.0\\%$$":[143],"interaction":[145],"detection.":[146],"These":[147],"represent,":[148],"respectively,":[149],"increases":[150],"$$115.7\\%$$":[152],"$$38.1\\%$$":[154],"over":[155],"achieved":[158],"by":[159],"tools.":[164],"Further":[165],"steps":[166],"improve":[168],"outlined,":[171],"including":[172],"detecting":[175],"relationships":[176],"among":[177],"characters.":[178],"Limitations":[179],"on":[180,196],"size":[182],"scope":[184],"our":[186],"testing":[187],"samples":[188],"acknowledged":[190],"exclusive":[194],"focus":[195],"relationship":[200],"type.":[201],"Taggus":[203],"pipeline":[204],"is":[205],"publicly":[206],"encourage":[209],"development":[210],"this":[212],"field":[213],"language.":[217]},"counts_by_year":[],"updated_date":"2026-04-30T09:15:22.047038","created_date":"2026-02-19T00:00:00"}
