{"id":"https://openalex.org/W4304098321","doi":"https://doi.org/10.1145/3503161.3548038","title":"TSRFormer","display_name":"TSRFormer","publication_year":2022,"publication_date":"2022-10-10","ids":{"openalex":"https://openalex.org/W4304098321","doi":"https://doi.org/10.1145/3503161.3548038"},"language":"en","primary_location":{"id":"doi:10.1145/3503161.3548038","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3548038","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013377621","display_name":"Weihong Lin","orcid":"https://orcid.org/0000-0001-7349-1611"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weihong Lin","raw_affiliation_strings":["Microsoft Research Aisa, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft Research Aisa, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082831669","display_name":"Zheng Sun","orcid":"https://orcid.org/0000-0002-7979-0345"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Sun","raw_affiliation_strings":["University of Chinese Academy of Sciences &amp; CASIA, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences &amp; CASIA, Beijing, China","institution_ids":["https://openalex.org/I4210165038","https://openalex.org/I4210112150"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004114734","display_name":"Chixiang Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chixiang Ma","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100621995","display_name":"Mingze Li","orcid":"https://orcid.org/0000-0001-7721-0768"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingze Li","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108274386","display_name":"Jiawei Wang","orcid":"https://orcid.org/0009-0008-8548-0061"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiawei Wang","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101926391","display_name":"Lei Sun","orcid":"https://orcid.org/0000-0002-4974-9122"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Sun","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039662070","display_name":"Qiang Huo","orcid":"https://orcid.org/0000-0003-2464-6482"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Huo","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5013377621"],"corresponding_institution_ids":["https://openalex.org/I4210113369"],"apc_list":null,"apc_paid":null,"fwci":2.4779,"has_fulltext":false,"cited_by_count":47,"citation_normalized_percentile":{"value":0.92695393,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"6473","last_page":"6482"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14319","display_name":"Currency Recognition and Detection","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.743281900882721},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6306575536727905},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5570328831672668},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5385964512825012},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5004348754882812},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4949144721031189},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4693635106086731},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4468461573123932},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4420667290687561},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3236052989959717}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.743281900882721},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6306575536727905},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5570328831672668},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5385964512825012},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5004348754882812},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4949144721031189},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4693635106086731},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4468461573123932},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4420667290687561},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3236052989959717},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3503161.3548038","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3548038","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1903029394","https://openalex.org/W2074966879","https://openalex.org/W2134164043","https://openalex.org/W2139872266","https://openalex.org/W2194775991","https://openalex.org/W2518276024","https://openalex.org/W2565639579","https://openalex.org/W2754191212","https://openalex.org/W2780740184","https://openalex.org/W2786162033","https://openalex.org/W2914231536","https://openalex.org/W2963150697","https://openalex.org/W2963351448","https://openalex.org/W2963516811","https://openalex.org/W3003206728","https://openalex.org/W3003496674","https://openalex.org/W3003931580","https://openalex.org/W3003953860","https://openalex.org/W3012573144","https://openalex.org/W3034997246","https://openalex.org/W3096609285","https://openalex.org/W3107064625","https://openalex.org/W3107331169","https://openalex.org/W3109870706","https://openalex.org/W3118722740","https://openalex.org/W3127736880","https://openalex.org/W3134658493","https://openalex.org/W3176384932","https://openalex.org/W3190766843","https://openalex.org/W3203974803","https://openalex.org/W3207083256","https://openalex.org/W3213341651","https://openalex.org/W4214627427","https://openalex.org/W4214693170"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W4246352526","https://openalex.org/W2121910908","https://openalex.org/W1996690921","https://openalex.org/W1522196789"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,36,48,115,136,200],"new":[3,49,107,152],"table":[4,24,31,69],"structure":[5],"recognition":[6],"(TSR)":[7],"approach,":[8,55],"called":[9],"TSRFormer,":[10],"to":[11,64,97,111,146,177],"robustly":[12],"recognizing":[13],"the":[14,74,83,99,172],"structures":[15],"of":[16,41,103,174],"complex":[17,180],"tables":[18,178],"with":[19,128,179],"geometrical":[20],"distortions":[21],"from":[22,68,114],"various":[23],"images.":[25],"Unlike":[26],"previous":[27],"methods,":[28],"we":[29,88,169],"formulate":[30],"separation":[32,66,84,133],"line":[33,37,85,134],"prediction":[34,54,86],"as":[35,191,193],"regression":[38],"problem":[39,45],"instead":[40],"an":[42],"image":[43],"segmentation":[44],"and":[46,80,166],"propose":[47,89],"two-stage":[50,75],"DETR":[51,76],"based":[52,140],"separator":[53],"dubbed":[56],"Sep":[57],"arator":[58],"RE":[59],"gression":[60],"TR":[61],"ansformer":[62],"(SepRETR),":[63],"predict":[65],"lines":[67],"images":[70],"directly.":[71],"To":[72],"make":[73],"framework":[77],"work":[78],"efficiently":[79],"effectively":[81],"for":[82],"task,":[87],"two":[90],"improvements:":[91],"1)":[92],"A":[93,106],"prior-enhanced":[94],"matching":[95],"strategy":[96],"solve":[98],"slow":[100],"convergence":[101],"issue":[102],"DETR;":[104],"2)":[105],"cross":[108],"attention":[109],"module":[110,143],"sample":[112],"features":[113],"high-resolution":[116],"convolutional":[117],"feature":[118],"map":[119],"directly":[120],"so":[121],"that":[122],"high":[123],"localization":[124],"accuracy":[125],"is":[126,144],"achieved":[127],"low":[129],"computational":[130],"cost.":[131],"After":[132],"prediction,":[135],"simple":[137],"relation":[138],"network":[139],"cell":[141],"merging":[142],"used":[145],"recover":[147],"spanning":[148,189],"cells.":[149],"With":[150],"these":[151],"techniques,":[153],"our":[154,175],"TSRFormer":[155],"achieves":[156],"state-of-the-art":[157],"performance":[158],"on":[159,199],"several":[160],"benchmark":[161],"datasets,":[162],"including":[163],"SciTSR,":[164],"PubTabNet":[165],"WTW.":[167],"Furthermore,":[168],"have":[170],"validated":[171],"robustness":[173],"approach":[176],"structures,":[181],"borderless":[182],"cells,":[183],"large":[184],"blank":[185],"spaces,":[186],"empty":[187],"or":[188,195],"cells":[190],"well":[192],"distorted":[194],"even":[196],"curved":[197],"shapes":[198],"more":[201],"challenging":[202],"real-world":[203],"in-house":[204],"dataset.":[205]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":13}],"updated_date":"2026-06-04T09:04:59.091469","created_date":"2022-10-10T00:00:00"}
