{"id":"https://openalex.org/W2574887079","doi":"https://doi.org/10.1109/tip.2017.2656474","title":"Scene Text Detection and Segmentation Based on Cascaded Convolution Neural Networks","display_name":"Scene Text Detection and Segmentation Based on Cascaded Convolution Neural Networks","publication_year":2017,"publication_date":"2017-01-20","ids":{"openalex":"https://openalex.org/W2574887079","doi":"https://doi.org/10.1109/tip.2017.2656474","mag":"2574887079","pmid":"https://pubmed.ncbi.nlm.nih.gov/28113342"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2017.2656474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2017.2656474","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081658414","display_name":"Youbao Tang","orcid":"https://orcid.org/0000-0001-8719-3375"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Youbao Tang","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030966569","display_name":"Xiangqian Wu","orcid":"https://orcid.org/0000-0002-0956-8757"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangqian Wu","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5081658414"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":5.0807,"has_fulltext":false,"cited_by_count":107,"citation_normalized_percentile":{"value":0.97215016,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"26","issue":"3","first_page":"1509","last_page":"1520"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8469383120536804},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7739015817642212},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7673004865646362},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7059093713760376},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.6665016412734985},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6329238414764404},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.602279543876648},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5390607118606567},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.48626863956451416},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.41322046518325806},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3806105852127075}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8469383120536804},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7739015817642212},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7673004865646362},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7059093713760376},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.6665016412734985},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6329238414764404},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.602279543876648},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5390607118606567},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.48626863956451416},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.41322046518325806},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3806105852127075},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2017.2656474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2017.2656474","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:28113342","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/28113342","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4099999964237213,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G3670463147","display_name":null,"funder_award_id":"61672194","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4581562623","display_name":null,"funder_award_id":"61472102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W70975097","https://openalex.org/W117491841","https://openalex.org/W776682613","https://openalex.org/W845365781","https://openalex.org/W1026856040","https://openalex.org/W1488125194","https://openalex.org/W1521064364","https://openalex.org/W1745334888","https://openalex.org/W1903029394","https://openalex.org/W1922126009","https://openalex.org/W1935817682","https://openalex.org/W1967140047","https://openalex.org/W1972065312","https://openalex.org/W1978729128","https://openalex.org/W1979122072","https://openalex.org/W1988461287","https://openalex.org/W1992257524","https://openalex.org/W1995790019","https://openalex.org/W1998042868","https://openalex.org/W1999284580","https://openalex.org/W2008806374","https://openalex.org/W2018451638","https://openalex.org/W2023415694","https://openalex.org/W2042536265","https://openalex.org/W2049951199","https://openalex.org/W2056435187","https://openalex.org/W2061802763","https://openalex.org/W2065613686","https://openalex.org/W2083954025","https://openalex.org/W2084594934","https://openalex.org/W2122221966","https://openalex.org/W2124404372","https://openalex.org/W2128854450","https://openalex.org/W2131163834","https://openalex.org/W2131447359","https://openalex.org/W2131673214","https://openalex.org/W2132952954","https://openalex.org/W2135231474","https://openalex.org/W2137718414","https://openalex.org/W2142159465","https://openalex.org/W2144554289","https://openalex.org/W2148214126","https://openalex.org/W2155893237","https://openalex.org/W2166949156","https://openalex.org/W2168894214","https://openalex.org/W2217433794","https://openalex.org/W2239285313","https://openalex.org/W2300131423","https://openalex.org/W2333563142","https://openalex.org/W2339589954","https://openalex.org/W2343052201","https://openalex.org/W2416007705","https://openalex.org/W2468724597","https://openalex.org/W2472159136","https://openalex.org/W2519818067","https://openalex.org/W2607333215","https://openalex.org/W2963606038","https://openalex.org/W6602936574","https://openalex.org/W6604768502","https://openalex.org/W6622384153","https://openalex.org/W6626567896","https://openalex.org/W6629021407","https://openalex.org/W6631165897","https://openalex.org/W6642972425","https://openalex.org/W6649973027","https://openalex.org/W6679774445","https://openalex.org/W6684665197","https://openalex.org/W6702842988","https://openalex.org/W6726857151"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W972276598","https://openalex.org/W4246352526","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W2087343574","https://openalex.org/W2964954556"],"abstract_inverted_index":{"Scene":[0],"text":[1,26,45,94,116,141,172],"detection":[2,27,51,173],"and":[3,8,28,56,62,102,167,174],"segmentation":[4,29,81,175],"are":[5,72,107,118,123,149],"two":[6],"important":[7],"challenging":[9],"research":[10],"problems":[11],"in":[12],"the":[13,60,63,90,97,139,161],"field":[14],"of":[15,66,144],"computer":[16],"vision.":[17],"This":[18],"paper":[19],"proposes":[20],"a":[21,40,127],"novel":[22],"method":[23,163],"for":[24],"scene":[25,171],"based":[30,42,76,129,147],"on":[31,155],"cascaded":[32],"convolution":[33],"neural":[34],"networks":[35],"(CNNs).":[36],"In":[37],"this":[38],"method,":[39],"CNN":[41,75,128,146],"text-aware":[43],"candidate":[44],"region":[46],"(CTR)":[47],"extraction":[48],"model":[49,79,132],"(named":[50,80,133],"network,":[52,82,135],"DNet)":[53],"is":[54,84],"designed":[55],"trained":[57],"using":[58,126],"both":[59],"edges":[61],"whole":[64],"regions":[65,117],"text,":[67],"with":[68,110],"which":[69],"coarse":[70,91],"CTRs":[71,92,106,122],"detected.":[73],"A":[74],"CTR":[77,130],"refinement":[78],"SNet)":[83],"then":[85],"constructed":[86],"to":[87,95,137],"precisely":[88],"segment":[89],"into":[93],"get":[96,138],"refined":[98,121],"CTRs.":[99],"With":[100],"DNet":[101],"SNet,":[103],"much":[104],"fewer":[105],"extracted":[108],"than":[109],"traditional":[111],"approaches":[112],"while":[113],"more":[114],"true":[115],"kept.":[119],"The":[120],"finally":[124],"classified":[125],"classification":[131,134],"CNet)":[136],"final":[140],"regions.":[142],"All":[143],"these":[145],"models":[148],"modified":[150],"from":[151],"VGGNet-16.":[152],"Extensive":[153],"experiments":[154],"three":[156],"benchmark":[157],"datasets":[158],"demonstrate":[159],"that":[160],"proposed":[162],"achieves":[164],"state-of-the-art":[165],"performance":[166],"greatly":[168],"outperforms":[169],"other":[170],"approaches.":[176]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":28},{"year":2018,"cited_by_count":10},{"year":2017,"cited_by_count":3}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
