{"id":"https://openalex.org/W4406458553","doi":"https://doi.org/10.1109/bigdata62323.2024.10825230","title":"Table Structure Recognition via Encoder/Decoder Vision Transformers","display_name":"Table Structure Recognition via Encoder/Decoder Vision Transformers","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406458553","doi":"https://doi.org/10.1109/bigdata62323.2024.10825230"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090107422","display_name":"Daniel Uedelhoven","orcid":null},"institutions":[{"id":"https://openalex.org/I4210144576","display_name":"Fraunhofer Institute for Intelligent Analysis and Information Systems","ror":"https://ror.org/04nc32781","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210144576","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Daniel Uedelhoven","raw_affiliation_strings":["Fraunhofer IAIS,Sankt Augustin,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Sankt Augustin,Germany","institution_ids":["https://openalex.org/I4210144576"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039510770","display_name":"Max L\u00fcbbering","orcid":"https://orcid.org/0000-0001-6291-9459"},"institutions":[{"id":"https://openalex.org/I4210144576","display_name":"Fraunhofer Institute for Intelligent Analysis and Information Systems","ror":"https://ror.org/04nc32781","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210144576","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Max L\u00fcbbering","raw_affiliation_strings":["Fraunhofer IAIS,Sankt Augustin,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Sankt Augustin,Germany","institution_ids":["https://openalex.org/I4210144576"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003875445","display_name":"Christian Bauckhage","orcid":"https://orcid.org/0000-0001-6615-2128"},"institutions":[{"id":"https://openalex.org/I4210144576","display_name":"Fraunhofer Institute for Intelligent Analysis and Information Systems","ror":"https://ror.org/04nc32781","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210144576","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christian Bauckhage","raw_affiliation_strings":["Fraunhofer IAIS,Sankt Augustin,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Sankt Augustin,Germany","institution_ids":["https://openalex.org/I4210144576"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034781887","display_name":"Rafet Sifa","orcid":null},"institutions":[{"id":"https://openalex.org/I4210144576","display_name":"Fraunhofer Institute for Intelligent Analysis and Information Systems","ror":"https://ror.org/04nc32781","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210144576","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rafet Sifa","raw_affiliation_strings":["Fraunhofer IAIS,Sankt Augustin,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Sankt Augustin,Germany","institution_ids":["https://openalex.org/I4210144576"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5090107422"],"corresponding_institution_ids":["https://openalex.org/I4210144576"],"apc_list":null,"apc_paid":null,"fwci":0.2624,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.58740893,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"8855","last_page":"8858"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9696000218391418,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9517999887466431,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7368401885032654},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7256786227226257},{"id":"https://openalex.org/keywords/lookup-table","display_name":"Lookup table","score":0.5277731418609619},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.5190061330795288},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5158826112747192},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4515969157218933},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43304187059402466},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4255644381046295},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.42331624031066895},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.1619769036769867},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.14331060647964478},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1387108862400055},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.12471392750740051},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.07410046458244324}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7368401885032654},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7256786227226257},{"id":"https://openalex.org/C134835016","wikidata":"https://www.wikidata.org/wiki/Q690265","display_name":"Lookup table","level":2,"score":0.5277731418609619},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.5190061330795288},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5158826112747192},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4515969157218933},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43304187059402466},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4255644381046295},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.42331624031066895},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.1619769036769867},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.14331060647964478},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1387108862400055},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12471392750740051},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.07410046458244324},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},{"id":"pmh:oai:publica.fraunhofer.de:publica/483049","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/483049","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321408","display_name":"Ministry of Education","ror":"https://ror.org/01p262204"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2022351003","https://openalex.org/W2065429801","https://openalex.org/W2074966879","https://openalex.org/W3034997246","https://openalex.org/W3094502228","https://openalex.org/W3096609285","https://openalex.org/W3217518891","https://openalex.org/W4313156423","https://openalex.org/W4385991106","https://openalex.org/W4394683372"],"related_works":["https://openalex.org/W2798215405","https://openalex.org/W2990962948","https://openalex.org/W2084169748","https://openalex.org/W2127529229","https://openalex.org/W2355515259","https://openalex.org/W4390516098","https://openalex.org/W2124289628","https://openalex.org/W1822998120","https://openalex.org/W2161474341","https://openalex.org/W2363440576"],"abstract_inverted_index":{"Table":[0],"structure":[1,78],"recognition":[2,79],"(TSR),":[3],"the":[4,8,13,25,172,177],"task":[5],"of":[6,10,30,55,63,96,158],"inferring":[7],"layout":[9],"tables,":[11],"including":[12,131],"row,":[14,84],"column,":[15,85],"and":[16,28,48,86,150],"cell":[17,87,118,126],"structure,":[18],"is":[19],"a":[20,51,60,74,93,102,106,145],"surprisingly":[21],"complex":[22],"task.":[23],"With":[24],"growing":[26,61],"amount":[27],"importance":[29],"digital":[31],"documents,":[32],"it":[33],"has":[34,42],"become":[35],"an":[36],"increasingly":[37],"relevant":[38],"problem,":[39],"which":[40,124,134],"nonetheless":[41],"not":[43],"yet":[44],"been":[45,70],"solved":[46],"adequately":[47],"still":[49],"presents":[50,73],"very":[52],"active":[53],"area":[54],"research.":[56],"In":[57],"recent":[58],"years,":[59],"number":[62],"deep-learning-based":[64,76],"approaches":[65],"to":[66,116,143,171],"table":[67,77,90,121],"parsing":[68],"have":[69],"proposed.This":[71],"paper":[72],"novel":[75],"method":[80],"that":[81,147],"can":[82,128,151],"predict":[83,117],"bounds":[88,127],"for":[89,120],"images":[91],"with":[92],"high":[94],"degree":[95],"accuracy.":[97],"To":[98],"achieve":[99],"this":[100],"goal,":[101],"multi-stage":[103],"pipeline":[104],"incorporating":[105],"Vision-Transformer-based":[107],"Autoencoder":[108,179],"model":[109,113,146,173],"was":[110,114,142,182],"devised.":[111],"This":[112],"trained":[115],"regions":[119],"images,":[122],"from":[123],"accurate":[125,153],"be":[129],"inferred,":[130],"spanning":[132],"cells":[133],"cover":[135],"multiple":[136],"rows":[137],"or":[138],"columns.":[139],"The":[140],"goal":[141],"obtain":[144],"generalizes":[148],"well":[149],"return":[152],"predictions":[154],"on":[155],"various":[156],"tables":[157],"differing":[159],"complexity,":[160],"even":[161],"if":[162],"they":[163],"contain":[164],"little":[165],"initial":[166],"structural":[167],"information.An":[168],"additional":[169],"modification":[170],"architecture":[174],"presented":[175],"in":[176],"Masked":[178],"(MAE)":[180],"approach":[181],"also":[183],"evaluated.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
