{"id":"https://openalex.org/W3199738066","doi":"https://doi.org/10.1109/tip.2021.3113157","title":"Semi-Supervised Pixel-Level Scene Text Segmentation by Mutually Guided Network","display_name":"Semi-Supervised Pixel-Level Scene Text Segmentation by Mutually Guided Network","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3199738066","doi":"https://doi.org/10.1109/tip.2021.3113157","mag":"3199738066","pmid":"https://pubmed.ncbi.nlm.nih.gov/34546922"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2021.3113157","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2021.3113157","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100443606","display_name":"Chuan Wang","orcid":"https://orcid.org/0000-0002-8559-4519"},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuan Wang","raw_affiliation_strings":["Megvii Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Megvii Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726805"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102008113","display_name":"Shan Zhao","orcid":"https://orcid.org/0000-0003-2296-4284"},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shan Zhao","raw_affiliation_strings":["Megvii Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Megvii Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726805"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101875601","display_name":"Li Zhu","orcid":"https://orcid.org/0000-0002-2532-2087"},"institutions":[{"id":"https://openalex.org/I10535382","display_name":"Chongqing University of Posts and Telecommunications","ror":"https://ror.org/03dgaqz26","country_code":"CN","type":"education","lineage":["https://openalex.org/I10535382"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Zhu","raw_affiliation_strings":["Chongqing University of Posts and Telecommunications, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"Chongqing University of Posts and Telecommunications, Chongqing, China","institution_ids":["https://openalex.org/I10535382"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101672879","display_name":"Kunming Luo","orcid":"https://orcid.org/0000-0002-5070-7392"},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kunming Luo","raw_affiliation_strings":["Megvii Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Megvii Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726805"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009275869","display_name":"Yanwen Guo","orcid":"https://orcid.org/0000-0002-7605-5206"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanwen Guo","raw_affiliation_strings":["National Key Lab for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"National Key Lab for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100440604","display_name":"Jue Wang","orcid":"https://orcid.org/0000-0002-3641-3136"},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jue Wang","raw_affiliation_strings":["Megvii Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Megvii Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726805"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039387461","display_name":"Shuaicheng Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuaicheng Liu","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China. (e-mail: liushuaicheng@uestc.edu.cn)"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China. (e-mail: liushuaicheng@uestc.edu.cn)","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100443606"],"corresponding_institution_ids":["https://openalex.org/I4401726805"],"apc_list":null,"apc_paid":null,"fwci":2.129,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.89368264,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"30","issue":null,"first_page":"8212","last_page":"8221"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7839940786361694},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7691110372543335},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7452289462089539},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.7348318696022034},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5505927205085754},{"id":"https://openalex.org/keywords/polygon","display_name":"Polygon (computer graphics)","score":0.5326492190361023},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49172165989875793},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4752112329006195},{"id":"https://openalex.org/keywords/text-detection","display_name":"Text detection","score":0.45420169830322266},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.39475977420806885}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7839940786361694},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7691110372543335},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7452289462089539},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.7348318696022034},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5505927205085754},{"id":"https://openalex.org/C190694206","wikidata":"https://www.wikidata.org/wiki/Q3276654","display_name":"Polygon (computer graphics)","level":3,"score":0.5326492190361023},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49172165989875793},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4752112329006195},{"id":"https://openalex.org/C2983589003","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text detection","level":3,"score":0.45420169830322266},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.39475977420806885},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2021.3113157","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2021.3113157","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:34546922","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34546922","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4883897726","display_name":null,"funder_award_id":"61872067","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5269616794","display_name":null,"funder_award_id":"61720106004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8213391892","display_name":null,"funder_award_id":"2019YFH0016","funder_id":"https://openalex.org/F4320333335","funder_display_name":"Sichuan Province Science and Technology Support Program"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320333335","display_name":"Sichuan Province Science and Technology Support Program","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1491389626","https://openalex.org/W1536680647","https://openalex.org/W1901129140","https://openalex.org/W1971822075","https://openalex.org/W1998042868","https://openalex.org/W2008806374","https://openalex.org/W2099247484","https://openalex.org/W2124404372","https://openalex.org/W2142159465","https://openalex.org/W2146835493","https://openalex.org/W2194187530","https://openalex.org/W2253806798","https://openalex.org/W2339589954","https://openalex.org/W2343052201","https://openalex.org/W2395611524","https://openalex.org/W2464918637","https://openalex.org/W2550687635","https://openalex.org/W2593539516","https://openalex.org/W2605982830","https://openalex.org/W2613718673","https://openalex.org/W2630837129","https://openalex.org/W2766895242","https://openalex.org/W2785383245","https://openalex.org/W2810983211","https://openalex.org/W2886714066","https://openalex.org/W2916797271","https://openalex.org/W2921406441","https://openalex.org/W2962773189","https://openalex.org/W2962810613","https://openalex.org/W2963253279","https://openalex.org/W2963299604","https://openalex.org/W2963677766","https://openalex.org/W2963687373","https://openalex.org/W2963881378","https://openalex.org/W2984016939","https://openalex.org/W2991090032","https://openalex.org/W3034263000","https://openalex.org/W3094664776","https://openalex.org/W3103010481","https://openalex.org/W3106228955","https://openalex.org/W3106250896","https://openalex.org/W4295246343","https://openalex.org/W6620707391","https://openalex.org/W6629590909","https://openalex.org/W6639824700","https://openalex.org/W6649973027","https://openalex.org/W6691603626","https://openalex.org/W6719590338","https://openalex.org/W6729791593","https://openalex.org/W6739696289","https://openalex.org/W6747438827","https://openalex.org/W6754138625","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W4285411112","https://openalex.org/W2085033728","https://openalex.org/W2171299904","https://openalex.org/W4390494008","https://openalex.org/W2922442631","https://openalex.org/W4380153838","https://openalex.org/W2053596378","https://openalex.org/W2168523118","https://openalex.org/W2383204375","https://openalex.org/W1522196789"],"abstract_inverted_index":{"In":[0],"this":[1,59,71],"paper":[2],"we":[3,61,90],"present":[4],"a":[5,15,25,92,98,105,129],"new":[6],"data-driven":[7],"method":[8],"for":[9,54,119],"pixel-level":[10,37,51,106,156],"scene":[11,20,157],"text":[12,21,26,38,63,78,107,158,172],"segmentation":[13,39],"from":[14],"single":[16],"natural":[17],"image.":[18],"Although":[19],"detection,":[22],"i.e.":[23],"producing":[24],"region":[27,64,79],"mask,":[28],"has":[29],"been":[30],"well":[31],"studied":[32],"in":[33,101,109,155],"the":[34,47,110,123,139,153,163,171,176],"past":[35],"decade,":[36],"is":[40,81,126],"still":[41],"an":[42,67],"open":[43],"problem":[44],"due":[45],"to":[46,137],"lack":[48],"of":[49,76,141],"massive":[50],"labeled":[52,77],"data":[53,69],"supervised":[55],"training.":[56],"To":[57,87],"tackle":[58],"issue,":[60],"incorporate":[62],"mask":[65,80,100,108,164],"as":[66,117],"auxiliary":[68],"into":[70],"task,":[72],"considering":[73],"acquiring":[74],"large-scale":[75],"commonly":[82],"less":[83],"expensive":[84],"and":[85,104,122,146],"time-consuming.":[86],"be":[88],"specific,":[89],"propose":[91],"mutually":[93,143],"guided":[94,144],"network":[95,125,151,168],"which":[96],"produces":[97],"polygon-level":[99],"one":[102],"branch":[103],"other.":[111],"The":[112],"two":[113],"branches'":[114],"outputs":[115],"serve":[116],"guidance":[118],"each":[120],"other":[121],"whole":[124],"trained":[127],"via":[128],"semi-supervised":[130],"learning":[131],"strategy.":[132],"Extensive":[133],"experiments":[134],"are":[135],"conducted":[136],"demonstrate":[138,162],"effectiveness":[140],"our":[142,150,167],"network,":[145],"experimental":[147],"results":[148],"show":[149],"outperforms":[152],"state-of-the-art":[154],"segmentation.":[159],"We":[160],"also":[161],"produced":[165],"by":[166],"could":[169],"improve":[170],"recognition":[173],"performance":[174],"besides":[175],"trivial":[177],"image":[178],"editing":[179],"application.":[180]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
