{"id":"https://openalex.org/W7125955799","doi":"https://doi.org/10.1109/smc58881.2025.11342634","title":"A Multi-modal Feature Interaction Enhancement Network for Complex Table Structure Recognition","display_name":"A Multi-modal Feature Interaction Enhancement Network for Complex Table Structure Recognition","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125955799","doi":"https://doi.org/10.1109/smc58881.2025.11342634"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11342634","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342634","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108047889","display_name":"Y\u00ec W\u00e1ng","orcid":"https://orcid.org/0000-0001-5697-0717"},"institutions":[{"id":"https://openalex.org/I179060312","display_name":"Northeast Electric Power University","ror":"https://ror.org/00zqaxa34","country_code":"CN","type":"education","lineage":["https://openalex.org/I179060312"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingdong Wang","raw_affiliation_strings":["Northeast Electric Power University,School of Computer Science,Jilin,China"],"affiliations":[{"raw_affiliation_string":"Northeast Electric Power University,School of Computer Science,Jilin,China","institution_ids":["https://openalex.org/I179060312"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124131901","display_name":"Peng Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I179060312","display_name":"Northeast Electric Power University","ror":"https://ror.org/00zqaxa34","country_code":"CN","type":"education","lineage":["https://openalex.org/I179060312"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Wang","raw_affiliation_strings":["Northeast Electric Power University,School of Computer Science,Jilin,China"],"affiliations":[{"raw_affiliation_string":"Northeast Electric Power University,School of Computer Science,Jilin,China","institution_ids":["https://openalex.org/I179060312"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124108903","display_name":"Fanqi Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I179060312","display_name":"Northeast Electric Power University","ror":"https://ror.org/00zqaxa34","country_code":"CN","type":"education","lineage":["https://openalex.org/I179060312"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fanqi Meng","raw_affiliation_strings":["Northeast Electric Power University,School of Computer Science,Jilin,China"],"affiliations":[{"raw_affiliation_string":"Northeast Electric Power University,School of Computer Science,Jilin,China","institution_ids":["https://openalex.org/I179060312"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5108047889"],"corresponding_institution_ids":["https://openalex.org/I179060312"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.71727042,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1562","last_page":"1569"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9230999946594238,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9230999946594238,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14319","display_name":"Currency Recognition and Detection","score":0.01140000019222498,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.005799999926239252,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.7149999737739563},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5859000086784363},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5584999918937683},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5317000150680542},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4880000054836273},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.459199994802475},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.45239999890327454},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.38600000739097595},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.3522999882698059}],"concepts":[{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.7149999737739563},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6998999714851379},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.616599977016449},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5859000086784363},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5584999918937683},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5317000150680542},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4880000054836273},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.459199994802475},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.45239999890327454},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.38600000739097595},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3840000033378601},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3522999882698059},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.34950000047683716},{"id":"https://openalex.org/C2988224531","wikidata":"https://www.wikidata.org/wiki/Q20830730","display_name":"Network structure","level":2,"score":0.31290000677108765},{"id":"https://openalex.org/C34947359","wikidata":"https://www.wikidata.org/wiki/Q665189","display_name":"Complex network","level":2,"score":0.30979999899864197},{"id":"https://openalex.org/C85407183","wikidata":"https://www.wikidata.org/wiki/Q1045785","display_name":"Semantic network","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2897000014781952},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2856000065803528},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C2780551164","wikidata":"https://www.wikidata.org/wiki/Q2306599","display_name":"Column (typography)","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2759000062942505},{"id":"https://openalex.org/C104122410","wikidata":"https://www.wikidata.org/wiki/Q1416406","display_name":"Network model","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C153604712","wikidata":"https://www.wikidata.org/wiki/Q7310755","display_name":"Relationship extraction","level":3,"score":0.2667999863624573},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2547000050544739}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11342634","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342634","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5400709509849548,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2786162033","https://openalex.org/W2786515133","https://openalex.org/W2998913931","https://openalex.org/W3003931580","https://openalex.org/W3034997246","https://openalex.org/W3107064625","https://openalex.org/W3118722740","https://openalex.org/W3127736880","https://openalex.org/W3134658493","https://openalex.org/W3158362813","https://openalex.org/W3159314278","https://openalex.org/W3167404434","https://openalex.org/W3176384932","https://openalex.org/W3180751782","https://openalex.org/W3201922353","https://openalex.org/W4214693170","https://openalex.org/W4312554912","https://openalex.org/W4375866544","https://openalex.org/W4386066115"],"related_works":[],"abstract_inverted_index":{"Aiming":[0],"to":[1,72,106,115,144,165,174],"the":[2,5,13,68,84,93,101,146,158,167,171,177,181,203,244],"problem":[3,14],"that":[4,188,212],"present":[6],"table":[7,41,85,172,182,208],"structure":[8,28,42,173,209],"recognition":[9,43,168,219,230],"methods":[10,206],"often":[11],"have":[12],"of":[15,19,33,54,70,77,83,96,170,180],"misrecognition":[16],"and":[17,29,49,79,86,138,141,156,199,238],"misalignment":[18],"cells":[20],"when":[21],"facing":[22],"complex":[23,26,40,222],"tables":[24,223],"with":[25,202,243],"row-column":[27],"abundant":[30],"semantic":[31,108,118],"content":[32],"cells,":[34],"this":[35,55,192],"study":[36],"proposes":[37],"a":[38,127],"multi-modal":[39],"network-MTSRN,":[44],"which":[45,133],"integrates":[46],"visual,":[47,136],"textual":[48],"positional":[50,139],"features.":[51],"The":[52,184],"innovation":[53],"method":[56,190,214],"lies":[57],"in,":[58],"firstly,":[59],"adding":[60],"CANN":[61],"image":[62],"visual":[63,81],"feature":[64],"extraction":[65,76],"branch":[66],"on":[67],"basis":[69],"GNN":[71,143],"realize":[73,176],"more":[74,217],"comprehensive":[75],"global":[78],"local":[80],"features":[82,109,148],"forming":[87],"pixel":[88],"location":[89],"network":[90,103],"by":[91],"combining":[92],"relative":[94],"positions":[95],"cells;":[97],"secondly,":[98],"we":[99,125],"construct":[100,126],"integrated":[102],"called":[104,131],"CLAT":[105],"obtain":[107],"among":[110],"text":[111,122],"contents":[112],"in":[113,163,191,196,224,236],"order":[114,164],"accurately":[116],"extract":[117],"connections":[119],"between":[120,161],"cell":[121],"contents;":[123],"finally,":[124],"node":[128],"prediction":[129],"module":[130],"NAPM,":[132],"interactively":[134],"enhances":[135],"semantic,":[137],"features,":[140],"employs":[142],"fuse":[145],"three":[147],"into":[149],"graph":[150],"nodes,":[151,162],"as":[152,154],"well":[153],"predicts":[155],"pairs":[157],"column":[159],"relationships":[160],"enhance":[166],"ability":[169],"eventually":[175],"accurate":[178,218],"reconstruction":[179],"structure.":[183],"experimental":[185],"results":[186,220],"show":[187],"our":[189,213,228],"paper":[193],"has":[194],"advantages":[195],"precision,":[197],"recall":[198],"F1":[200],"compared":[201,242],"current":[204],"popular":[205],"for":[207,221],"recognition,":[210],"proving":[211],"can":[215],"achieve":[216],"realistic":[225],"scenarios.":[226],"Meanwhile,":[227],"designed":[229],"model":[231],"gets":[232],"nearly":[233],"13%":[234],"improvement":[235],"Row_prediction":[237],"Col_prediction":[239],"metrics":[240],"respectively":[241],"baseline":[245],"model.":[246]},"counts_by_year":[],"updated_date":"2026-01-29T23:17:01.242718","created_date":"2026-01-29T00:00:00"}
