{"id":"https://openalex.org/W3160898296","doi":"https://doi.org/10.1109/icpr48806.2021.9413092","title":"Mutually Guided Dual-Task Network for Scene Text Detection","display_name":"Mutually Guided Dual-Task Network for Scene Text Detection","publication_year":2021,"publication_date":"2021-01-10","ids":{"openalex":"https://openalex.org/W3160898296","doi":"https://doi.org/10.1109/icpr48806.2021.9413092","mag":"3160898296"},"language":"en","primary_location":{"id":"doi:10.1109/icpr48806.2021.9413092","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9413092","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018871383","display_name":"Mengbiao Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mengbiao Zhao","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100628393","display_name":"Wei Feng","orcid":"https://orcid.org/0000-0003-3711-6333"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Feng","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039310938","display_name":"Fei Yin","orcid":"https://orcid.org/0000-0002-6412-9140"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Yin","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082548671","display_name":"Xu-Yao Zhang","orcid":"https://orcid.org/0000-0001-9260-188X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu-Yao Zhang","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100714202","display_name":"Cheng\u2010Lin Liu","orcid":"https://orcid.org/0000-0002-6743-4175"},"institutions":[{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng-Lin Liu","raw_affiliation_strings":["CAS Center for Excellence of Brain Science and Intelligence Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"CAS Center for Excellence of Brain Science and Intelligence Technology, Beijing, China","institution_ids":["https://openalex.org/I4210097554"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5018871383"],"corresponding_institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.0961,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.36078431,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"6928","last_page":"6934"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7976881265640259},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7428367733955383},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6254059076309204},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.613408625125885},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.6133772134780884},{"id":"https://openalex.org/keywords/line","display_name":"Line (geometry)","score":0.5980045795440674},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5514456629753113},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.5242862105369568},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4833890497684479},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.45618879795074463},{"id":"https://openalex.org/keywords/attention-network","display_name":"Attention network","score":0.4283018112182617},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3702218532562256},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3445412516593933},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3420429527759552},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.2160569429397583}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7976881265640259},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7428367733955383},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6254059076309204},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.613408625125885},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.6133772134780884},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.5980045795440674},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5514456629753113},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.5242862105369568},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4833890497684479},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.45618879795074463},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.4283018112182617},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3702218532562256},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3445412516593933},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3420429527759552},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2160569429397583},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr48806.2021.9413092","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9413092","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.47999998927116394,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G103427903","display_name":null,"funder_award_id":"2019141","funder_id":"https://openalex.org/F4320322847","funder_display_name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences"},{"id":"https://openalex.org/G6737899511","display_name":null,"funder_award_id":"61733007,61573355,61633021,61721004,62076236","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6866922408","display_name":null,"funder_award_id":"ZDBS-LY-7004","funder_id":"https://openalex.org/F4320327616","funder_display_name":"Fundamental Research Funds for the Key Research Program of Chongqing Science and Technology Commission"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322847","display_name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences","ror":"https://ror.org/031141b54"},{"id":"https://openalex.org/F4320327616","display_name":"Fundamental Research Funds for the Key Research Program of Chongqing Science and Technology Commission","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1903029394","https://openalex.org/W2074849287","https://openalex.org/W2108598243","https://openalex.org/W2144554289","https://openalex.org/W2339589954","https://openalex.org/W2464918637","https://openalex.org/W2519818067","https://openalex.org/W2550687635","https://openalex.org/W2565639579","https://openalex.org/W2604735854","https://openalex.org/W2605076167","https://openalex.org/W2605982830","https://openalex.org/W2772800855","https://openalex.org/W2784050770","https://openalex.org/W2785383245","https://openalex.org/W2810028092","https://openalex.org/W2875814315","https://openalex.org/W2902494497","https://openalex.org/W2962773189","https://openalex.org/W2962810613","https://openalex.org/W2962914239","https://openalex.org/W2963150697","https://openalex.org/W2963398399","https://openalex.org/W2963647456","https://openalex.org/W2963807362","https://openalex.org/W2964018263","https://openalex.org/W2988098900","https://openalex.org/W3102695566","https://openalex.org/W3106250896","https://openalex.org/W6620707391","https://openalex.org/W6719590338","https://openalex.org/W6726857151","https://openalex.org/W6729791593","https://openalex.org/W6730903564","https://openalex.org/W6747438827","https://openalex.org/W6752143097","https://openalex.org/W6752731419","https://openalex.org/W6756127406","https://openalex.org/W6756206753","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2358755282","https://openalex.org/W2625833328","https://openalex.org/W1533177136","https://openalex.org/W4380994516","https://openalex.org/W2251519152"],"abstract_inverted_index":{"Scene":[0],"text":[1,13,39,66,97,121,140],"detection":[2,40,60,141],"has":[3,58],"been":[4],"studied":[5],"extensively.":[6],"Existing":[7],"methods":[8],"detect":[9],"either":[10,17],"words":[11,118],"or":[12,19],"lines":[14],"and":[15,37,42,64,110,138,150,154],"use":[16,43],"word-level":[18,36,63,137],"line-level":[20,38,65,139],"annotated":[21],"data":[22,45],"for":[23,62,76,106,119],"training.":[24],"In":[25],"this":[26],"paper,":[27],"we":[28,70],"propose":[29,71],"a":[30,72],"dual-task":[31,56,148],"network":[32,57,149],"that":[33],"can":[34],"perform":[35],"simultaneously":[41],"training":[44,79],"of":[46,49,80,95,117,130,136,145,157],"both":[47],"levels":[48],"annotation":[50],"to":[51,100],"boost":[52],"the":[53,77,81,91,96,103,107,120,126,131,143,146,155],"performance.":[54],"The":[55],"two":[59,82,85],"heads":[61],"detection,":[67],"respectively.":[68],"Then":[69],"mutual":[73,151],"guidance":[74,152],"scheme":[75],"joint":[78],"tasks":[83],"with":[84,162],"modules:":[86],"line":[87,98,122],"filtering":[88],"module":[89,113],"utilizes":[90],"output":[92,127],"feature":[93,128],"map":[94,129],"detector":[99,123],"filter":[101],"out":[102],"non-text":[104],"regions":[105],"word":[108,111,132],"detector,":[109],"enhancing":[112],"provides":[114],"prior":[115],"positions":[116],"depending":[124],"on":[125],"detector.":[133],"Experimental":[134],"results":[135,156],"demonstrate":[142],"effectiveness":[144],"proposed":[147],"scheme,":[153],"our":[158],"method":[159],"are":[160],"competitive":[161],"state-of-the-art":[163],"methods.":[164]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
