{"id":"https://openalex.org/W4403616351","doi":"https://doi.org/10.1007/s10462-024-11000-0","title":"A survey of recent approaches to form understanding in scanned documents","display_name":"A survey of recent approaches to form understanding in scanned documents","publication_year":2024,"publication_date":"2024-10-21","ids":{"openalex":"https://openalex.org/W4403616351","doi":"https://doi.org/10.1007/s10462-024-11000-0"},"language":"en","primary_location":{"id":"doi:10.1007/s10462-024-11000-0","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10462-024-11000-0","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10462-024-11000-0.pdf","source":{"id":"https://openalex.org/S122814990","display_name":"Artificial Intelligence Review","issn_l":"0269-2821","issn":["0269-2821","1573-7462"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence Review","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10462-024-11000-0.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064852810","display_name":"Abdelrahman Abdallah","orcid":"https://orcid.org/0000-0001-8747-4927"},"institutions":[{"id":"https://openalex.org/I190249584","display_name":"Universit\u00e4t Innsbruck","ror":"https://ror.org/054pv6659","country_code":"AT","type":"education","lineage":["https://openalex.org/I190249584"]}],"countries":["AT"],"is_corresponding":true,"raw_author_name":"Abdelrahman Abdallah","raw_affiliation_strings":["Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria","institution_ids":["https://openalex.org/I190249584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094105680","display_name":"Daniel Eberharter","orcid":null},"institutions":[{"id":"https://openalex.org/I190249584","display_name":"Universit\u00e4t Innsbruck","ror":"https://ror.org/054pv6659","country_code":"AT","type":"education","lineage":["https://openalex.org/I190249584"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Daniel Eberharter","raw_affiliation_strings":["Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria","institution_ids":["https://openalex.org/I190249584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094105681","display_name":"Zoe Pfister","orcid":null},"institutions":[{"id":"https://openalex.org/I190249584","display_name":"Universit\u00e4t Innsbruck","ror":"https://ror.org/054pv6659","country_code":"AT","type":"education","lineage":["https://openalex.org/I190249584"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Zoe Pfister","raw_affiliation_strings":["Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria","institution_ids":["https://openalex.org/I190249584"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079733597","display_name":"Adam Jatowt","orcid":"https://orcid.org/0000-0001-7235-0665"},"institutions":[{"id":"https://openalex.org/I190249584","display_name":"Universit\u00e4t Innsbruck","ror":"https://ror.org/054pv6659","country_code":"AT","type":"education","lineage":["https://openalex.org/I190249584"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Adam Jatowt","raw_affiliation_strings":["Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Innsbruck, 6020, Innsbruck, Tirol, Austria","institution_ids":["https://openalex.org/I190249584"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5064852810"],"corresponding_institution_ids":["https://openalex.org/I190249584"],"apc_list":{"value":2490,"currency":"EUR","value_usd":3090},"apc_paid":{"value":2490,"currency":"EUR","value_usd":3090},"fwci":1.7296,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.86185046,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"57","issue":"12","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7409399151802063},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5011239051818848},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.401563823223114}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7409399151802063},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5011239051818848},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.401563823223114}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10462-024-11000-0","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10462-024-11000-0","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10462-024-11000-0.pdf","source":{"id":"https://openalex.org/S122814990","display_name":"Artificial Intelligence Review","issn_l":"0269-2821","issn":["0269-2821","1573-7462"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence Review","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10462-024-11000-0","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10462-024-11000-0","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10462-024-11000-0.pdf","source":{"id":"https://openalex.org/S122814990","display_name":"Artificial Intelligence Review","issn_l":"0269-2821","issn":["0269-2821","1573-7462"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence Review","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403616351.pdf"},"referenced_works_count":73,"referenced_works":["https://openalex.org/W1966382373","https://openalex.org/W2024959534","https://openalex.org/W2070836593","https://openalex.org/W2194775991","https://openalex.org/W2510759893","https://openalex.org/W2549139847","https://openalex.org/W2565639579","https://openalex.org/W2943845043","https://openalex.org/W2945784886","https://openalex.org/W2949212908","https://openalex.org/W2963150697","https://openalex.org/W2963341956","https://openalex.org/W2980913015","https://openalex.org/W2986619406","https://openalex.org/W2988217457","https://openalex.org/W2988326850","https://openalex.org/W2997154779","https://openalex.org/W3003428515","https://openalex.org/W3003484198","https://openalex.org/W3003711898","https://openalex.org/W3004330198","https://openalex.org/W3092009239","https://openalex.org/W3093218477","https://openalex.org/W3100219394","https://openalex.org/W3104953317","https://openalex.org/W3120043490","https://openalex.org/W3163650427","https://openalex.org/W3173325518","https://openalex.org/W3176664887","https://openalex.org/W3176851559","https://openalex.org/W3182680257","https://openalex.org/W3200439183","https://openalex.org/W3202839357","https://openalex.org/W3205981739","https://openalex.org/W4213019189","https://openalex.org/W4214493665","https://openalex.org/W4224228116","https://openalex.org/W4226020328","https://openalex.org/W4245031736","https://openalex.org/W4285241172","https://openalex.org/W4304013646","https://openalex.org/W4304698333","https://openalex.org/W4312233877","https://openalex.org/W4319300491","https://openalex.org/W4322747033","https://openalex.org/W4376226279","https://openalex.org/W4384636790","https://openalex.org/W4385574075","https://openalex.org/W4385768059","https://openalex.org/W4385990987","https://openalex.org/W4385991043","https://openalex.org/W4386065837","https://openalex.org/W4386076403","https://openalex.org/W4386221015","https://openalex.org/W4386566506","https://openalex.org/W4388187290","https://openalex.org/W4389520670","https://openalex.org/W4393152682","https://openalex.org/W4393154852","https://openalex.org/W4393160827","https://openalex.org/W4395111538","https://openalex.org/W4402702988","https://openalex.org/W6600175266","https://openalex.org/W6600424091","https://openalex.org/W6600545252","https://openalex.org/W6600741150","https://openalex.org/W6601211009","https://openalex.org/W6602426847","https://openalex.org/W6605755270","https://openalex.org/W6605991194","https://openalex.org/W6607281299","https://openalex.org/W6702248584","https://openalex.org/W6831684532"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Abstract":[0],"This":[1],"paper":[2],"presents":[3],"a":[4],"comprehensive":[5],"survey":[6],"of":[7,15,21,68,96,128,147,154,162],"over":[8,73],"100":[9],"research":[10,62],"works":[11],"on":[12,37],"the":[13,19,32,74,94,110,129,145,148,152,181],"topic":[14],"form":[16,48,166,187],"understanding":[17,49,188],"in":[18,31,47,55,120,164,179],"context":[20],"scanned":[22,115],"documents.":[23],"We":[24],"delve":[25],"into":[26,93],"recent":[27],"advancements":[28],"and":[29,71,81,137,157,174],"breakthroughs":[30],"field,":[33],"with":[34,117,176],"particular":[35],"focus":[36],"transformer-based":[38],"models,":[39],"which":[40,139],"have":[41,104],"been":[42],"shown":[43],"to":[44,53,58,112,171],"improve":[45],"performance":[46,146],"tasks":[50],"by":[51,108],"up":[52],"25%":[54],"accuracy":[56],"compared":[57],"traditional":[59],"methods.":[60],"Our":[61],"methodology":[63],"involves":[64],"an":[65,126,159],"in-depth":[66],"analysis":[67],"popular":[69],"documents":[70,116],"trends":[72],"last":[75],"decade,":[76],"including":[77],"15":[78],"state-of-the-art":[79],"models":[80,156],"10":[82],"benchmark":[83],"datasets.":[84],"By":[85,150],"examining":[86],"these":[87,155],"works,":[88],"we":[89,100,124,169],"offer":[90],"novel":[91],"insights":[92],"evolution":[95],"this":[97],"domain.":[98],"Specifically,":[99],"highlight":[101],"how":[102],"transformers":[103],"revolutionized":[105],"form-understanding":[106],"techniques":[107],"enhancing":[109],"ability":[111],"process":[113],"noisy":[114],"significant":[118],"improvements":[119],"OCR":[121],"accuracy.":[122],"Furthermore,":[123],"present":[125],"overview":[127],"most":[130,182],"relevant":[131],"datasets,":[132],"such":[133],"as":[134,141],"FUNSD,":[135],"CORD,":[136],"SROIE,":[138],"serve":[140],"benchmarks":[142],"for":[143,185],"evaluating":[144],"models.":[149],"comparing":[151],"capabilities":[153],"reporting":[158],"average":[160],"improvement":[161],"10\u201315%":[163],"key":[165],"extraction":[167],"tasks,":[168],"aim":[170],"provide":[172],"researchers":[173],"practitioners":[175],"useful":[177],"guidance":[178],"selecting":[180],"suitable":[183],"solutions":[184],"their":[186],"applications.":[189]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
