{"id":"https://openalex.org/W2903483654","doi":"https://doi.org/10.1109/icpr.2018.8545073","title":"Scene Text Detection with Recurrent Instance Segmentation","display_name":"Scene Text Detection with Recurrent Instance Segmentation","publication_year":2018,"publication_date":"2018-08-01","ids":{"openalex":"https://openalex.org/W2903483654","doi":"https://doi.org/10.1109/icpr.2018.8545073","mag":"2903483654"},"language":"en","primary_location":{"id":"doi:10.1109/icpr.2018.8545073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8545073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100628393","display_name":"Wei Feng","orcid":"https://orcid.org/0000-0003-3711-6333"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wei Feng","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, P.R. China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100736473","display_name":"Wenhao He","orcid":"https://orcid.org/0000-0002-3922-5720"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen-Hao He","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, P.R. China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039310938","display_name":"Fei Yin","orcid":"https://orcid.org/0000-0002-6412-9140"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Yin","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, P.R. China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100714202","display_name":"Cheng\u2010Lin Liu","orcid":"https://orcid.org/0000-0002-6743-4175"},"institutions":[{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng-Lin Liu","raw_affiliation_strings":["CAS Center for Excellence of Brain Science and Intelligence Technology, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"CAS Center for Excellence of Brain Science and Intelligence Technology, Beijing, P.R. China","institution_ids":["https://openalex.org/I4210097554"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100628393"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.1459958,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8377845287322998},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7777180671691895},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7409213781356812},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.6965911388397217},{"id":"https://openalex.org/keywords/text-detection","display_name":"Text detection","score":0.692466139793396},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6459290385246277},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5941380858421326},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.5823898911476135},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5076755285263062},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4570692777633667},{"id":"https://openalex.org/keywords/text-recognition","display_name":"Text recognition","score":0.4519122540950775},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.4462691843509674},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3008853793144226},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2843669652938843}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8377845287322998},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7777180671691895},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7409213781356812},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.6965911388397217},{"id":"https://openalex.org/C2983589003","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text detection","level":3,"score":0.692466139793396},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6459290385246277},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5941380858421326},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.5823898911476135},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5076755285263062},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4570692777633667},{"id":"https://openalex.org/C2983812711","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text recognition","level":3,"score":0.4519122540950775},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.4462691843509674},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3008853793144226},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2843669652938843},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr.2018.8545073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8545073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.49000000953674316,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W27675589","https://openalex.org/W260801291","https://openalex.org/W607748843","https://openalex.org/W639708223","https://openalex.org/W753012316","https://openalex.org/W1522301498","https://openalex.org/W1533861849","https://openalex.org/W1903029394","https://openalex.org/W1935817682","https://openalex.org/W2008806374","https://openalex.org/W2064675550","https://openalex.org/W2129987527","https://openalex.org/W2144554289","https://openalex.org/W2216125271","https://openalex.org/W2217433794","https://openalex.org/W2239285313","https://openalex.org/W2255466643","https://openalex.org/W2272561391","https://openalex.org/W2339589954","https://openalex.org/W2395360388","https://openalex.org/W2464918637","https://openalex.org/W2472159136","https://openalex.org/W2473415337","https://openalex.org/W2519818067","https://openalex.org/W2550687635","https://openalex.org/W2555182955","https://openalex.org/W2604735854","https://openalex.org/W2605982830","https://openalex.org/W2613718673","https://openalex.org/W2962773189","https://openalex.org/W2962804639","https://openalex.org/W2963150697","https://openalex.org/W2963455537","https://openalex.org/W2963659353","https://openalex.org/W2964100062","https://openalex.org/W2964121744","https://openalex.org/W3106250896","https://openalex.org/W6622239757","https://openalex.org/W6631943919","https://openalex.org/W6689003893","https://openalex.org/W6726857151","https://openalex.org/W6729791593","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W2740819638","https://openalex.org/W2936226716","https://openalex.org/W2736409883","https://openalex.org/W2964100062","https://openalex.org/W2990832606","https://openalex.org/W2902375677","https://openalex.org/W3199738066","https://openalex.org/W2623546809","https://openalex.org/W2972163838","https://openalex.org/W1489772046","https://openalex.org/W3016205750","https://openalex.org/W2810003256","https://openalex.org/W2970910956","https://openalex.org/W3137197566","https://openalex.org/W2808268865","https://openalex.org/W2964296749","https://openalex.org/W2751748110","https://openalex.org/W2791369865","https://openalex.org/W3136055522","https://openalex.org/W2404161323"],"abstract_inverted_index":{"Convolutional":[0,43],"Neural":[1,48],"Network":[2,49],"(CNN)":[3],"based":[4,40],"scene":[5,54],"text":[6,55,66,85],"detection":[7,56],"methods":[8],"mostly":[9],"employ":[10],"the":[11,19,71,74,103,133,140],"semantic":[12],"segmentation":[13],"(text/non-text":[14],"classification)":[15],"task":[16,138],"to":[17,51,64,79],"localize":[18],"regions":[20],"of":[21,135],"texts.":[22],"However,":[23],"they":[24],"cannot":[25],"distinguish":[26],"different":[27],"text-lines":[28],"like":[29],"instance":[30,58,86],"segmentation.":[31,59],"In":[32],"this":[33],"paper,":[34],"we":[35],"propose":[36],"a":[37,98],"novel":[38],"framework":[39],"on":[41,114],"Fully":[42],"Networks":[44],"(FCN)":[45],"and":[46,57,67,70,82,125],"Recurrent":[47],"(RNN)":[50],"achieve":[52],"both":[53],"The":[60,108],"FCN":[61,78],"is":[62],"used":[63],"classify":[65],"non-text":[68],"regions,":[69],"RNN":[72,141],"utilizes":[73],"features":[75],"extracted":[76],"by":[77,97],"simultaneously":[80],"detect":[81],"segment":[83],"one":[84],"at":[87],"each":[88],"time":[89],"step.":[90],"Meanwhile,":[91],"it":[92],"also":[93],"extracts":[94],"bounding":[95],"boxes":[96],"much":[99],"simpler":[100],"way":[101],"than":[102],"non-maximum":[104],"suppression":[105],"(NMS)":[106],"method.":[107],"proposed":[109],"method":[110],"achieves":[111],"competitive":[112],"results":[113],"two":[115],"public":[116],"benchmarks":[117],"including":[118],"ICDAR":[119,126],"2015":[120],"Incidental":[121],"Scene":[122,129],"Text":[123,130],"Dataset":[124],"2013":[127],"Focused":[128],"Dataset.":[131],"Moreover,":[132],"benefits":[134],"adding":[136],"regression":[137],"in":[139],"module":[142],"are":[143],"manifested.":[144]},"counts_by_year":[{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
