{"id":"https://openalex.org/W3159307593","doi":"https://doi.org/10.1109/tpami.2021.3077555","title":"PAN++: Towards Efficient and Accurate End-to-End Spotting of Arbitrarily-Shaped Text","display_name":"PAN++: Towards Efficient and Accurate End-to-End Spotting of Arbitrarily-Shaped Text","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3159307593","doi":"https://doi.org/10.1109/tpami.2021.3077555","mag":"3159307593","pmid":"https://pubmed.ncbi.nlm.nih.gov/33945471"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2021.3077555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3077555","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101827340","display_name":"Wenhai Wang","orcid":"https://orcid.org/0000-0002-2418-3134"},"institutions":[{"id":"https://openalex.org/I163340411","display_name":"Hohai University","ror":"https://ror.org/01wd4xt90","country_code":"CN","type":"education","lineage":["https://openalex.org/I163340411"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenhai Wang","raw_affiliation_strings":["National Key Lab for Novel Software Technology, Nanjing University, 12581 Nanjing, Jiangsu Province, China, (e-mail: wangwenhai362@163.com)"],"affiliations":[{"raw_affiliation_string":"National Key Lab for Novel Software Technology, Nanjing University, 12581 Nanjing, Jiangsu Province, China, (e-mail: wangwenhai362@163.com)","institution_ids":["https://openalex.org/I163340411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041031140","display_name":"Enze Xie","orcid":"https://orcid.org/0000-0001-6890-1049"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Enze Xie","raw_affiliation_strings":["Computer Science, University of Hong Kong, 25809 Hong Kong, Hong Kong, Hong Kong, (e-mail: xieenze@hku.hk)","[Computer Science, University of Hong Kong, 25809 Hong Kong, Hong Kong, Hong Kong, (e-mail: xieenze@hku.hk)]"],"affiliations":[{"raw_affiliation_string":"Computer Science, University of Hong Kong, 25809 Hong Kong, Hong Kong, Hong Kong, (e-mail: xieenze@hku.hk)","institution_ids":["https://openalex.org/I889458895"]},{"raw_affiliation_string":"[Computer Science, University of Hong Kong, 25809 Hong Kong, Hong Kong, Hong Kong, (e-mail: xieenze@hku.hk)]","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100693026","display_name":"Xiang Li","orcid":"https://orcid.org/0000-0002-4996-7365"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiang Li","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, 12436 Nanjing, Jiangsu, China, (e-mail: xiang.li.implus@njust.edu.cn)"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, 12436 Nanjing, Jiangsu, China, (e-mail: xiang.li.implus@njust.edu.cn)","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101599729","display_name":"Xuebo Liu","orcid":"https://orcid.org/0000-0001-8524-2006"},"institutions":[{"id":"https://openalex.org/I2802845136","display_name":"Specim (Finland)","ror":"https://ror.org/019frbz80","country_code":"FI","type":"company","lineage":["https://openalex.org/I2802845136"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Xuebo Liu","raw_affiliation_strings":["OCR Team, SenseTime, Beijing, Beijing, China, (e-mail: lufo816@gmail.com)"],"affiliations":[{"raw_affiliation_string":"OCR Team, SenseTime, Beijing, Beijing, China, (e-mail: lufo816@gmail.com)","institution_ids":["https://openalex.org/I2802845136"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100751872","display_name":"Ding Liang","orcid":"https://orcid.org/0000-0001-9774-4687"},"institutions":[{"id":"https://openalex.org/I4210100200","display_name":"China Internet Network Information Center","ror":"https://ror.org/011t9p927","country_code":"CN","type":"nonprofit","lineage":["https://openalex.org/I4210100200","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ding Liang","raw_affiliation_strings":["OCR Team, SenseTime, Beijing, Beijing, China, (e-mail: liangding@sensetime.com)"],"affiliations":[{"raw_affiliation_string":"OCR Team, SenseTime, Beijing, Beijing, China, (e-mail: liangding@sensetime.com)","institution_ids":["https://openalex.org/I4210100200"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101406829","display_name":"Zhibo Yang","orcid":"https://orcid.org/0000-0003-2343-7750"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Zhibo","raw_affiliation_strings":["Computer Science and Technology, Tsinghua University, 12442 hangzhou, zhejiang, China, (e-mail: yangzhibo450@gmail.com)"],"affiliations":[{"raw_affiliation_string":"Computer Science and Technology, Tsinghua University, 12442 hangzhou, zhejiang, China, (e-mail: yangzhibo450@gmail.com)","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061696740","display_name":"Tong L\u00fc","orcid":"https://orcid.org/0000-0002-7051-5347"},"institutions":[{"id":"https://openalex.org/I134687103","display_name":"Nanjing Tech University","ror":"https://ror.org/03sd35x91","country_code":"CN","type":"education","lineage":["https://openalex.org/I134687103"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Lu","raw_affiliation_strings":["National Key Lab for Novel Software Technology, Nanjing University, Nanjing University, 12581 Nanjing, Jiangsu, China, (e-mail: lutong@nju.edu.cn)"],"affiliations":[{"raw_affiliation_string":"National Key Lab for Novel Software Technology, Nanjing University, Nanjing University, 12581 Nanjing, Jiangsu, China, (e-mail: lutong@nju.edu.cn)","institution_ids":["https://openalex.org/I134687103"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006294869","display_name":"Chunhua Shen","orcid":"https://orcid.org/0000-0002-8648-8718"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Chunhua Shen","raw_affiliation_strings":["School of Computer Science, Monash University, 2541 Clayton, Victoria, Australia, (e-mail: chunhua.shen@adelaide.edu.au)"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Monash University, 2541 Clayton, Victoria, Australia, (e-mail: chunhua.shen@adelaide.edu.au)","institution_ids":["https://openalex.org/I56590836"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101827340"],"corresponding_institution_ids":["https://openalex.org/I163340411"],"apc_list":null,"apc_paid":null,"fwci":10.0006,"has_fulltext":false,"cited_by_count":135,"citation_normalized_percentile":{"value":0.98775128,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"44","issue":"9","first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spotting","display_name":"Spotting","score":0.8965113162994385},{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.8152782917022705},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6001139879226685},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5919782519340515},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.38372114300727844},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3836970329284668},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3673170506954193},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3203892111778259}],"concepts":[{"id":"https://openalex.org/C2779506182","wikidata":"https://www.wikidata.org/wiki/Q7580141","display_name":"Spotting","level":2,"score":0.8965113162994385},{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.8152782917022705},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6001139879226685},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5919782519340515},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.38372114300727844},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3836970329284668},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3673170506954193},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3203892111778259}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2021.3077555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3077555","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:33945471","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33945471","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":80,"referenced_works":["https://openalex.org/W70975097","https://openalex.org/W639708223","https://openalex.org/W1522301498","https://openalex.org/W1686810756","https://openalex.org/W1836465849","https://openalex.org/W1903029394","https://openalex.org/W1972065312","https://openalex.org/W1988461287","https://openalex.org/W2064675550","https://openalex.org/W2074849287","https://openalex.org/W2108598243","https://openalex.org/W2112796928","https://openalex.org/W2122221966","https://openalex.org/W2127141656","https://openalex.org/W2144554289","https://openalex.org/W2153182373","https://openalex.org/W2194187530","https://openalex.org/W2194775991","https://openalex.org/W2239285313","https://openalex.org/W2343052201","https://openalex.org/W2519818067","https://openalex.org/W2532759528","https://openalex.org/W2550687635","https://openalex.org/W2560023338","https://openalex.org/W2565639579","https://openalex.org/W2593539516","https://openalex.org/W2604735854","https://openalex.org/W2605076167","https://openalex.org/W2605982830","https://openalex.org/W2740767790","https://openalex.org/W2772800855","https://openalex.org/W2777652944","https://openalex.org/W2784050770","https://openalex.org/W2785383245","https://openalex.org/W2786962101","https://openalex.org/W2795619303","https://openalex.org/W2810028092","https://openalex.org/W2810983211","https://openalex.org/W2875814315","https://openalex.org/W2896049206","https://openalex.org/W2902494497","https://openalex.org/W2906333459","https://openalex.org/W2962790387","https://openalex.org/W2962810613","https://openalex.org/W2962914239","https://openalex.org/W2962986948","https://openalex.org/W2963150697","https://openalex.org/W2963161243","https://openalex.org/W2963299604","https://openalex.org/W2963353821","https://openalex.org/W2963398399","https://openalex.org/W2963516811","https://openalex.org/W2963647456","https://openalex.org/W2963712589","https://openalex.org/W2963840241","https://openalex.org/W2963857746","https://openalex.org/W2963977642","https://openalex.org/W2964018263","https://openalex.org/W2964065044","https://openalex.org/W2964294787","https://openalex.org/W2964296749","https://openalex.org/W2964444661","https://openalex.org/W2964685115","https://openalex.org/W2965066169","https://openalex.org/W2967615747","https://openalex.org/W2970910956","https://openalex.org/W2981969038","https://openalex.org/W2983626510","https://openalex.org/W2988098900","https://openalex.org/W2991626090","https://openalex.org/W3034792612","https://openalex.org/W3102695566","https://openalex.org/W3106228955","https://openalex.org/W4297775537","https://openalex.org/W6631190155","https://openalex.org/W6637373629","https://openalex.org/W6638667902","https://openalex.org/W6737664043","https://openalex.org/W6739901393","https://openalex.org/W6746206475"],"related_works":["https://openalex.org/W2034439647","https://openalex.org/W4249589822","https://openalex.org/W2103063669","https://openalex.org/W3184921334","https://openalex.org/W4255446307","https://openalex.org/W2033009170","https://openalex.org/W2058491579","https://openalex.org/W1483316057","https://openalex.org/W118429992","https://openalex.org/W4300154353"],"abstract_inverted_index":{"Scene":[0],"text":[1,24,34,45,62,66,80,93,209],"detection":[2,157],"and":[3,18,43,164,179],"recognition":[4,169],"have":[5],"been":[6],"well":[7,96],"explored":[8],"in":[9,49],"the":[10,15,56,105,125,128,176,180,196,203,218,224],"past":[11],"few":[12],"years.":[13],"Despite":[14],"progress,":[16],"efficient":[17,142,167],"accurate":[19],"end-to-end":[20,33,208],"spotting":[21,35,210],"of":[22,46,127,135,147,198,212],"arbitrarily-shaped":[23,92],"remains":[25],"challenging.":[26],"In":[27],"this":[28],"work,":[29],"we":[30,82,131],"propose":[31],"an":[32,166,207],"framework,":[36],"termed":[37],"PAN++,":[38],"which":[39,117,221],"can":[40,88,108],"efficiently":[41],"detect":[42],"recognize":[44],"arbitrary":[47],"shapes":[48],"natural":[50],"scenes.":[51],"PAN++":[52,205],"is":[53,118],"based":[54],"on":[55,217],"kernel":[57,67,86,106,129,177],"representation":[58,87,107,178],"that":[59,84],"reformulates":[60],"a":[61,65,102,112,133,140,155],"line":[63],"as":[64,101,137],"(central":[68],"region)":[69],"surrounded":[70],"by":[71,111],"peripheral":[72],"pixels.":[73],"By":[74],"systematically":[75],"comparing":[76],"with":[77,160,171],"existing":[78],"scene":[79],"representations,":[81],"show":[83,195],"our":[85,183,199],"not":[89],"only":[90],"describe":[91],"but":[94],"also":[95],"distinguish":[97],"adjacent":[98],"text.":[99],"Moreover,":[100],"pixel-based":[103],"representation,":[104,130],"be":[109,230],"predicted":[110],"single":[113],"fully":[114],"convolutional":[115],"network,":[116],"very":[119],"friendly":[120],"to":[121],"real-time":[122],"applications.":[123],"Taking":[124],"advantages":[126],"design":[132],"series":[134],"components":[136],"follows:":[138],"1)":[139],"computationally":[141],"feature":[143],"enhancement":[144],"network":[145],"composed":[146],"stacked":[148],"Feature":[149],"Pyramid":[150],"Enhancement":[151],"Modules":[152],"(FPEMs);":[153],"2)":[154],"lightweight":[156],"head":[158,170],"cooperating":[159],"Pixel":[161],"Aggregation":[162],"(PA);":[163],"3)":[165],"attention-based":[168],"Masked":[172],"RoI.":[173],"Benefiting":[174],"from":[175],"tailored":[181],"components,":[182],"method":[184],"achieves":[185,206],"high":[186],"inference":[187],"speed":[188],"while":[189],"maintaining":[190],"competitive":[191],"accuracy.":[192],"Extensive":[193],"experiments":[194],"superiority":[197],"method.":[200,227],"For":[201],"example,":[202],"proposed":[204],"F-measure":[211],"64.9":[213],"at":[214],"29.2":[215],"FPS":[216],"Total-Text":[219],"dataset,":[220],"significantly":[222],"outperforms":[223],"previous":[225],"best":[226],"Code":[228],"will":[229],"available":[231],"at:":[232],"git.io/PAN.":[233]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":31},{"year":2024,"cited_by_count":47},{"year":2023,"cited_by_count":27},{"year":2022,"cited_by_count":26},{"year":2021,"cited_by_count":3}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
