{"id":"https://openalex.org/W4414254078","doi":"https://doi.org/10.1007/978-3-032-04624-6_20","title":"Evaluating Handwritten Text Recognition in\u00a0Medieval Notarial Manuscripts: A\u00a0New Dataset and\u00a0Comprehensive Analysis","display_name":"Evaluating Handwritten Text Recognition in\u00a0Medieval Notarial Manuscripts: A\u00a0New Dataset and\u00a0Comprehensive Analysis","publication_year":2025,"publication_date":"2025-09-16","ids":{"openalex":"https://openalex.org/W4414254078","doi":"https://doi.org/10.1007/978-3-032-04624-6_20"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-032-04624-6_20","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-032-04624-6_20","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1007/978-3-032-04624-6_20","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051763204","display_name":"Mariona Coll Ardanuy","orcid":"https://orcid.org/0000-0001-8455-7196"},"institutions":[{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]},{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Mariona Coll Ardanuy","raw_affiliation_strings":["Barcelona Supercomputing Center (BSC), Barcelona, Spain"],"raw_orcid":"https://orcid.org/0000-0001-8455-7196","affiliations":[{"raw_affiliation_string":"Barcelona Supercomputing Center (BSC), Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003682850","display_name":"Iban Berganzo\u2010Besga","orcid":"https://orcid.org/0000-0002-6161-2452"},"institutions":[{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]},{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Iban Berganzo-Besga","raw_affiliation_strings":["Barcelona Supercomputing Center (BSC), Barcelona, Spain"],"raw_orcid":"https://orcid.org/0000-0002-6161-2452","affiliations":[{"raw_affiliation_string":"Barcelona Supercomputing Center (BSC), Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059983436","display_name":"Ramon Sarobe Huesca","orcid":"https://orcid.org/0000-0003-2099-3567"},"institutions":[{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]},{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Ramon Sarobe","raw_affiliation_strings":["Barcelona Supercomputing Center (BSC), Barcelona, Spain"],"raw_orcid":"https://orcid.org/0000-0003-2099-3567","affiliations":[{"raw_affiliation_string":"Barcelona Supercomputing Center (BSC), Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5119639624","display_name":"Coral Cuadrada","orcid":"https://orcid.org/0000-0003-4577-2381"},"institutions":[{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]},{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Coral Cuadrada","raw_affiliation_strings":["Barcelona Supercomputing Center (BSC), Barcelona, Spain"],"raw_orcid":"https://orcid.org/0000-0003-4577-2381","affiliations":[{"raw_affiliation_string":"Barcelona Supercomputing Center (BSC), Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5051763204"],"corresponding_institution_ids":["https://openalex.org/I2799803557","https://openalex.org/I9617848"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":{"value":5000,"currency":"EUR","value_usd":5392},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.54388133,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"340","last_page":"357"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.97079998254776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parchment","display_name":"Parchment","score":0.6960999965667725},{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.6682999730110168},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5706999897956848},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.5490999817848206},{"id":"https://openalex.org/keywords/handwriting-recognition","display_name":"Handwriting recognition","score":0.5288000106811523},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4745999872684479},{"id":"https://openalex.org/keywords/historical-document","display_name":"Historical document","score":0.4489000141620636},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.4253000020980835},{"id":"https://openalex.org/keywords/catalan","display_name":"Catalan","score":0.38499999046325684}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8647000193595886},{"id":"https://openalex.org/C2780845164","wikidata":"https://www.wikidata.org/wiki/Q226697","display_name":"Parchment","level":2,"score":0.6960999965667725},{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.6682999730110168},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5706999897956848},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5655999779701233},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.5490999817848206},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5309000015258789},{"id":"https://openalex.org/C112640561","wikidata":"https://www.wikidata.org/wiki/Q2440634","display_name":"Handwriting recognition","level":3,"score":0.5288000106811523},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4745999872684479},{"id":"https://openalex.org/C2778371909","wikidata":"https://www.wikidata.org/wiki/Q3771738","display_name":"Historical document","level":2,"score":0.4489000141620636},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.4253000020980835},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4034999907016754},{"id":"https://openalex.org/C164105321","wikidata":"https://www.wikidata.org/wiki/Q7026","display_name":"Catalan","level":2,"score":0.38499999046325684},{"id":"https://openalex.org/C9299288","wikidata":"https://www.wikidata.org/wiki/Q1163234","display_name":"Medieval Latin","level":2,"score":0.3709000051021576},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.3386000096797943},{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.2802000045776367},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C2983812711","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text recognition","level":3,"score":0.2680000066757202},{"id":"https://openalex.org/C2778310199","wikidata":"https://www.wikidata.org/wiki/Q194070","display_name":"Facsimile","level":3,"score":0.26190000772476196},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.25859999656677246},{"id":"https://openalex.org/C143128703","wikidata":"https://www.wikidata.org/wiki/Q12554","display_name":"Middle Ages","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C67905146","wikidata":"https://www.wikidata.org/wiki/Q5287646","display_name":"Document processing","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-032-04624-6_20","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-032-04624-6_20","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.1007/978-3-032-04624-6_20","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-032-04624-6_20","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2008274828","https://openalex.org/W2048176942","https://openalex.org/W2127141656","https://openalex.org/W2149128132","https://openalex.org/W2785892129","https://openalex.org/W2786974559","https://openalex.org/W2787677190","https://openalex.org/W2890571723","https://openalex.org/W2911227954","https://openalex.org/W2984055017","https://openalex.org/W3012289950","https://openalex.org/W3181798399","https://openalex.org/W3212368439","https://openalex.org/W4206244669","https://openalex.org/W4221050583","https://openalex.org/W4303945557","https://openalex.org/W4308571509","https://openalex.org/W4311363515","https://openalex.org/W4318263479","https://openalex.org/W4365143033","https://openalex.org/W4382202677","https://openalex.org/W4388098581","https://openalex.org/W4391767333","https://openalex.org/W4392952747","https://openalex.org/W4393699312","https://openalex.org/W4394828349","https://openalex.org/W4402667133","https://openalex.org/W6892792744","https://openalex.org/W6931716462","https://openalex.org/W6948623437","https://openalex.org/W6949605097"],"related_works":[],"abstract_inverted_index":{"Vast":[0],"amounts":[1],"of":[2,45,69,126,130,148,207,220,228],"medieval":[3,50],"notarial":[4,54],"documents":[5,30],"have":[6,140],"been":[7],"preserved":[8],"and":[9,99,104,107,128,165,212],"digitized":[10,71],"in":[11,21,85,113,118,133,144,196],"Catalan":[12],"archives.":[13],"These":[14],"collections":[15],"provide":[16,186],"invaluable":[17],"insights":[18],"into":[19,155],"life":[20],"the":[22,43,60,79,86,218],"Middle":[23],"Ages.":[24],"To":[25],"harness":[26],"their":[27],"full":[28],"potential,":[29],"need":[31],"to":[32,62,77,101,190],"be":[33],"accurately":[34],"transcribed.":[35],"This":[36],"paper":[37],"introduces":[38],"a":[39,134,181,187,199,205],"new":[40],"dataset":[41,66,171],"for":[42,223],"task":[44],"handwritten":[46],"text":[47],"recognition":[48,147],"on":[49,53,57,169],"manuscripts,":[51,150],"focusing":[52],"charters":[55],"written":[56],"parchment":[58],"from":[59,179],"13th":[61],"15th":[63],"centuries.":[64,110],"Our":[65],"is":[67,83],"comprised":[68],"100":[70],"manuscripts":[72,122],"(3,369":[73],"lines),":[74],"carefully":[75,200],"selected":[76],"represent":[78],"large":[80],"variation":[81],"that":[82,159,173,216],"present":[84],"sources,":[87],"encompassing":[88],"at":[89],"least":[90],"80":[91],"distinct":[92],"hands,":[93],"various":[94],"document":[95],"types":[96],"(from":[97],"sales":[98],"inventories":[100],"last":[102],"wills":[103],"marriage":[105],"contracts),":[106],"spanning":[108],"three":[109],"Written":[111],"primarily":[112],"Medieval":[114,119],"Latin":[115],"with":[116,151,198],"fragments":[117],"Catalan,":[120],"these":[121,174],"exhibit":[123],"varying":[124],"stages":[125],"preservation":[127],"degrees":[129],"deterioration,":[131],"resulting":[132],"very":[135],"diverse":[136],"dataset.":[137,202],"Recent":[138],"years":[139],"seen":[141],"impressive":[142],"advancements":[143],"automatic":[145],"handwriting":[146],"historical":[149,229],"significant":[152],"effort":[153],"put":[154],"creating":[156],"general":[157],"models":[158,175,193],"perform":[160],"well":[161],"across":[162],"several":[163],"centuries":[164],"scripts.":[166],"The":[167],"experiments":[168,208],"our":[170],"show":[172],"are":[176],"still":[177],"far":[178],"providing":[180],"generalizable":[182],"solution,":[183],"but":[184],"nevertheless":[185],"good":[188],"foundation":[189],"fine-tune":[191],"robust":[192],"when":[194],"used":[195],"combination":[197],"curated":[201],"We":[203],"report":[204],"series":[206],"using":[209],"an":[210,225],"extensive":[211],"nuanced":[213],"evaluation":[214],"approach":[215],"demonstrates":[217],"importance":[219],"data":[221],"selection":[222],"achieving":[224],"accurate":[226],"transcription":[227],"manuscripts.":[230]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
