{"id":"https://openalex.org/W4226041419","doi":"https://doi.org/10.1109/tmm.2022.3165717","title":"SRRV: A Novel Document Object Detector Based on Spatial-Related Relation and Vision","display_name":"SRRV: A Novel Document Object Detector Based on Spatial-Related Relation and Vision","publication_year":2022,"publication_date":"2022-04-07","ids":{"openalex":"https://openalex.org/W4226041419","doi":"https://doi.org/10.1109/tmm.2022.3165717"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2022.3165717","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2022.3165717","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091137994","display_name":"Hengyue Bi","orcid":"https://orcid.org/0000-0002-1578-3576"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hengyue Bi","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-1578-3576","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084189725","display_name":"Canhui Xu","orcid":"https://orcid.org/0000-0002-9907-6747"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Canhui Xu","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-9907-6747","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086704004","display_name":"Cao Shi","orcid":"https://orcid.org/0000-0003-2748-5557"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cao Shi","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0003-2748-5557","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075916788","display_name":"Guozhu Liu","orcid":"https://orcid.org/0000-0002-4191-3186"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guozhu Liu","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-4191-3186","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019981002","display_name":"Yuteng Li","orcid":"https://orcid.org/0000-0002-8880-4526"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuteng Li","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-8880-4526","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100755320","display_name":"Honghong Zhang","orcid":"https://orcid.org/0000-0002-7169-7760"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Honghong Zhang","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-7169-7760","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101661600","display_name":"Jing Qu","orcid":"https://orcid.org/0000-0001-6525-9716"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Qu","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0001-6525-9716","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7261,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.85464851,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"25","issue":null,"first_page":"3788","last_page":"3798"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.79219651222229},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6076318025588989},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.566300094127655},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5361127257347107},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.533330500125885},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.528378963470459},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5016119480133057},{"id":"https://openalex.org/keywords/spatial-relation","display_name":"Spatial relation","score":0.48884934186935425},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4734235107898712},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.4110293686389923},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3486919403076172},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.34295785427093506},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.22177883982658386},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09388437867164612}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79219651222229},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6076318025588989},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.566300094127655},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5361127257347107},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.533330500125885},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.528378963470459},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5016119480133057},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.48884934186935425},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4734235107898712},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.4110293686389923},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3486919403076172},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34295785427093506},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.22177883982658386},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09388437867164612},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2022.3165717","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2022.3165717","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2919925446","display_name":null,"funder_award_id":"61702135","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7273554519","display_name":null,"funder_award_id":"61806107","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W64813323","https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W1686810756","https://openalex.org/W1903029394","https://openalex.org/W1996823523","https://openalex.org/W2147880316","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2288122362","https://openalex.org/W2463598282","https://openalex.org/W2529459268","https://openalex.org/W2549139847","https://openalex.org/W2565639579","https://openalex.org/W2570343428","https://openalex.org/W2588503511","https://openalex.org/W2625219738","https://openalex.org/W2742400085","https://openalex.org/W2785462444","https://openalex.org/W2786162033","https://openalex.org/W2787835872","https://openalex.org/W2803472033","https://openalex.org/W2805199679","https://openalex.org/W2902089218","https://openalex.org/W2922714365","https://openalex.org/W2948519073","https://openalex.org/W2963093690","https://openalex.org/W2963150697","https://openalex.org/W2963450895","https://openalex.org/W2964015378","https://openalex.org/W2964051675","https://openalex.org/W2964094751","https://openalex.org/W2964241181","https://openalex.org/W2964346820","https://openalex.org/W2966316879","https://openalex.org/W2970042171","https://openalex.org/W2973058802","https://openalex.org/W2997154779","https://openalex.org/W2998227124","https://openalex.org/W3003334191","https://openalex.org/W3003711898","https://openalex.org/W3010415660","https://openalex.org/W3034404784","https://openalex.org/W3034514377","https://openalex.org/W3034579518","https://openalex.org/W3048216881","https://openalex.org/W3104953317","https://openalex.org/W3106250896","https://openalex.org/W3121626821","https://openalex.org/W3122111862","https://openalex.org/W3163021734","https://openalex.org/W3200280307","https://openalex.org/W3201049093","https://openalex.org/W3201871940","https://openalex.org/W3208168396","https://openalex.org/W6637373629","https://openalex.org/W6682082992","https://openalex.org/W6684191040","https://openalex.org/W6726873649","https://openalex.org/W6785652829","https://openalex.org/W6797650329"],"related_works":["https://openalex.org/W2358757401","https://openalex.org/W2347703430","https://openalex.org/W3148227991","https://openalex.org/W3001521712","https://openalex.org/W2520082489","https://openalex.org/W2362913948","https://openalex.org/W4309346246","https://openalex.org/W2116266067","https://openalex.org/W2364189591","https://openalex.org/W2028237718"],"abstract_inverted_index":{"Document":[0],"object":[1,12,43],"detection":[2],"is":[3],"a":[4,40],"challenging":[5],"task":[6],"due":[7],"to":[8,111,125],"layout":[9],"complexity":[10],"and":[11,35,49,65,94,135,147,155,170],"diversity.":[13],"Most":[14],"of":[15,54,76,108],"existing":[16],"methods":[17],"mainly":[18],"focus":[19],"on":[20,46,151],"vision":[21,50,57,134],"information,":[22,114],"neglecting":[23],"representative":[24],"inherent":[25],"spatial-related":[26,47],"relationship":[27],"among":[28],"document":[29,42],"objects.":[30],"To":[31],"capture":[32],"structural":[33],"information":[34,74,104,128,163],"contextual":[36],"dependencies,":[37],"we":[38],"propose":[39],"novel":[41],"detector":[44],"based":[45],"relation":[48,61,86,113,127,136,162],"(SRRV).":[51],"It":[52],"consists":[53],"three":[55],"parts:":[56],"feature":[58,62,70,78,82,87,145],"extraction":[59,71],"network,":[60],"aggregation":[63,88],"network":[64,72,89,143],"result":[66,141],"refinement":[67,142],"network.":[68],"Vision":[69],"enhances":[73],"propagation":[75],"hierarchical":[77],"pyramid":[79],"by":[80],"adopting":[81],"augmentation":[83],"paths.":[84],"Then,":[85],"combines":[90],"graph":[91,95,99,116],"construction":[92,100],"module":[93,101,118],"learning":[96,117],"module.":[97],"Specifically,":[98],"calculates":[102],"spatial":[103,161],"from":[105],"geometric":[106],"attributes":[107],"region":[109],"proposals":[110],"encode":[112],"while":[115],"stacks":[119],"Graph":[120],"Convolutional":[121],"Network":[122],"(GCN)":[123],"layers":[124],"aggregate":[126],"at":[129],"global":[130],"scale.":[131],"Both":[132],"the":[133,152,165],"features":[137],"are":[138],"fed":[139],"into":[140],"for":[144],"fusion":[146],"relational":[148],"reasoning.":[149],"Experiments":[150],"PubLayNet,":[153],"POD":[154],"Article":[156],"Regions":[157],"datasets":[158],"demonstrate":[159],"that":[160],"improves":[164],"performance":[166],"with":[167],"better":[168],"accuracy":[169],"more":[171],"precise":[172],"bounding":[173],"box":[174],"prediction.":[175]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
