{"id":"https://openalex.org/W4407667616","doi":"https://doi.org/10.1007/s00799-025-00413-z","title":"Enhancing OCR in historical documents with complex layouts through machine learning","display_name":"Enhancing OCR in historical documents with complex layouts through machine learning","publication_year":2025,"publication_date":"2025-02-17","ids":{"openalex":"https://openalex.org/W4407667616","doi":"https://doi.org/10.1007/s00799-025-00413-z"},"language":"en","primary_location":{"id":"doi:10.1007/s00799-025-00413-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00799-025-00413-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00799-025-00413-z.pdf","source":{"id":"https://openalex.org/S110615584","display_name":"International Journal on Digital Libraries","issn_l":"1432-1300","issn":["1432-1300","1432-5012"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal on Digital Libraries","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00799-025-00413-z.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093734247","display_name":"David Fleischhacker","orcid":"https://orcid.org/0009-0003-4787-9091"},"institutions":[{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]}],"countries":["AT"],"is_corresponding":true,"raw_author_name":"David Fleischhacker","raw_affiliation_strings":["Institute of Interactive Systems and Data Science, Graz University of Technology, Sandgasse 36, 8010, Graz, Austria"],"raw_orcid":"https://orcid.org/0009-0003-4787-9091","affiliations":[{"raw_affiliation_string":"Institute of Interactive Systems and Data Science, Graz University of Technology, Sandgasse 36, 8010, Graz, Austria","institution_ids":["https://openalex.org/I4092182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014398832","display_name":"Roman Kern","orcid":"https://orcid.org/0000-0003-0202-6100"},"institutions":[{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]},{"id":"https://openalex.org/I4210088621","display_name":"Know Center Research GmbH (Austria)","ror":"https://ror.org/004zhad81","country_code":"AT","type":"company","lineage":["https://openalex.org/I4210088621"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Roman Kern","raw_affiliation_strings":["Institute of Interactive Systems and Data Science, Graz University of Technology, Sandgasse 36, 8010, Graz, Austria","Know Center, Sandgasse 36, 8010, Graz, Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Interactive Systems and Data Science, Graz University of Technology, Sandgasse 36, 8010, Graz, Austria","institution_ids":["https://openalex.org/I4092182"]},{"raw_affiliation_string":"Know Center, Sandgasse 36, 8010, Graz, Austria","institution_ids":["https://openalex.org/I4210088621"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068741102","display_name":"Wolfgang G\u00f6derle","orcid":"https://orcid.org/0000-0002-9417-5316"},"institutions":[{"id":"https://openalex.org/I190249584","display_name":"Universit\u00e4t Innsbruck","ror":"https://ror.org/054pv6659","country_code":"AT","type":"education","lineage":["https://openalex.org/I190249584"]},{"id":"https://openalex.org/I4210161060","display_name":"Max Planck Institute for the Science of Human History","ror":"https://ror.org/05mjrzy91","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210161060"]}],"countries":["AT","DE"],"is_corresponding":false,"raw_author_name":"Wolfgang G\u00f6derle","raw_affiliation_strings":["Department Structural Changes of the Technosphere, Max Planck Institute of Geoanthropology, Kahlaische Strasse 10, 07745, Jena, Germany","Department of Austrian History, Institute of History, University of Innsbruck, Innrain 52, 6020, Innsbruck, Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department Structural Changes of the Technosphere, Max Planck Institute of Geoanthropology, Kahlaische Strasse 10, 07745, Jena, Germany","institution_ids":["https://openalex.org/I4210161060"]},{"raw_affiliation_string":"Department of Austrian History, Institute of History, University of Innsbruck, Innrain 52, 6020, Innsbruck, Austria","institution_ids":["https://openalex.org/I190249584"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5093734247"],"corresponding_institution_ids":["https://openalex.org/I4092182"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":{"value":2290,"currency":"EUR","value_usd":2890},"fwci":12.0523,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.98686557,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"26","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8545206785202026},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5167288184165955},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4417835474014282},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4360649883747101},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4173118472099304}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8545206785202026},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5167288184165955},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4417835474014282},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4360649883747101},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4173118472099304}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/s00799-025-00413-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00799-025-00413-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00799-025-00413-z.pdf","source":{"id":"https://openalex.org/S110615584","display_name":"International Journal on Digital Libraries","issn_l":"1432-1300","issn":["1432-1300","1432-5012"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal on Digital Libraries","raw_type":"journal-article"},{"id":"pmh:oai:econstor.eu:10419/319163","is_oa":true,"landing_page_url":"https://hdl.handle.net/10419/319163","pdf_url":"https://www.econstor.eu/bitstream/10419/319163/1/00799_2025_Article_413.pdf","source":{"id":"https://openalex.org/S4306401696","display_name":"Econstor (Econstor)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"doc-type:article"},{"id":"pmh:oai:econstor.eu:10419/323277","is_oa":true,"landing_page_url":"https://hdl.handle.net/10419/323277","pdf_url":"https://www.econstor.eu/bitstream/10419/323277/1/00799_2025_Article_413.pdf","source":{"id":"https://openalex.org/S4306401696","display_name":"Econstor (Econstor)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"doc-type:article"},{"id":"pmh:oai:pure.mpg.de:item_3637790","is_oa":true,"landing_page_url":"http://hdl.handle.net/21.11116/0000-0010-C7B6-0","pdf_url":null,"source":{"id":"https://openalex.org/S4306400654","display_name":"MPG.PuRe (Max Planck Society)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149899117","host_organization_name":"Max Planck Society","host_organization_lineage":["https://openalex.org/I149899117"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"International Journal on Digital Libraries","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1007/s00799-025-00413-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00799-025-00413-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00799-025-00413-z.pdf","source":{"id":"https://openalex.org/S110615584","display_name":"International Journal on Digital Libraries","issn_l":"1432-1300","issn":["1432-1300","1432-5012"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal on Digital Libraries","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320310430","display_name":"TU Graz, Internationale Beziehungen und Mobilit\u00e4tsprogramme","ror":"https://ror.org/00d7xrm67"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407667616.pdf"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1598866093","https://openalex.org/W2487933861","https://openalex.org/W2787480186","https://openalex.org/W2902561591","https://openalex.org/W2943472041","https://openalex.org/W2943942362","https://openalex.org/W2973047034","https://openalex.org/W2980913015","https://openalex.org/W2997154779","https://openalex.org/W3004524434","https://openalex.org/W3021347667","https://openalex.org/W3023805750","https://openalex.org/W3065976884","https://openalex.org/W3090423411","https://openalex.org/W3104953317","https://openalex.org/W3105988348","https://openalex.org/W3122950209","https://openalex.org/W3132296545","https://openalex.org/W3163273160","https://openalex.org/W3194824089","https://openalex.org/W3216272314","https://openalex.org/W4205868038","https://openalex.org/W4210446100","https://openalex.org/W4226236673","https://openalex.org/W4252392280","https://openalex.org/W4281859181","https://openalex.org/W4306385899","https://openalex.org/W4318465586"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Abstract":[0],"This":[1],"paper":[2],"explores":[3],"the":[4,19,29,38,56,62,74,84,91,107,128,148,177,184],"challenge":[5],"of":[6,14,31,64,99,113,162,179,188],"processing":[7],"and":[8,52,61,132,145,152,168,186],"extracting":[9],"information":[10],"from":[11,18],"large":[12],"quantities":[13],"printed":[15],"serial":[16],"sources":[17],"19th":[20],"century,":[21],"which":[22],"have":[23],"been":[24],"largely":[25],"untapped":[26],"due":[27],"to":[28,83,126],"inadequacies":[30],"existing":[32],"extraction":[33,131,185],"techniques.":[34],"We":[35,86],"focus":[36],"on":[37],"Habsburg":[39,57],"Central":[40],"Europe\u2019s":[41],"Hof-":[42,92],"und":[43,93],"Staatsschematismus":[44,94],",":[45],"a":[46,100,110,157],"comprehensive":[47],"record":[48],"published":[49],"between":[50],"1702":[51],"1918":[53],"that":[54],"documents":[55],"civil":[58],"service\u2019s":[59],"hierarchy":[60],"evolution":[63],"its":[65],"central":[66],"administration":[67],"over":[68],"two":[69],"centuries.":[70],"Our":[71,135],"approach":[72],"sees":[73],"significant":[75,138],"investment":[76],"into":[77],"machine":[78],"learning-driven":[79],"layout":[80],"detection":[81,151],"prior":[82],"OCR-process.":[85],"generated":[87],"synthetic":[88],"data":[89],"mimicking":[90],"style":[95,125],"for":[96,122,166,172],"initial":[97],"training":[98],"Faster":[101],"R-CNN":[102],"model,":[103],"followed":[104],"by":[105],"fine-tuning":[106],"model":[108],"with":[109,147],"smaller":[111],"dataset":[112],"manually":[114],"annotated":[115],"historical":[116,189],"documents.":[117,190],"Subsequently,":[118],"we":[119],"optimised":[120],"Tesseract-OCR":[121],"our":[123],"document":[124],"enhance":[127],"combined":[129,149],"structure":[130,150],"OCR":[133,141,154],"process.":[134],"evaluation":[136],"demonstrates":[137],"improvements":[139],"in":[140,159,182],"performance":[142],"metrics":[143],"(WER":[144],"CER),":[146],"fine-tuned":[153],"process":[155],"showing":[156],"decrease":[158],"error":[160],"rates":[161],"15.68":[163],"percentage":[164,170],"points":[165,171],"CER":[167],"19.95":[169],"WER.":[173],"These":[174],"findings":[175],"underscore":[176],"potential":[178],"ML":[180],"techniques":[181],"facilitating":[183],"analysis":[187]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
