{"id":"https://openalex.org/W4287588076","doi":"https://doi.org/10.1109/icip46576.2022.9897699","title":"Polygon-Free: Unconstrained Scene Text Detection with Box Annotations","display_name":"Polygon-Free: Unconstrained Scene Text Detection with Box Annotations","publication_year":2022,"publication_date":"2022-10-16","ids":{"openalex":"https://openalex.org/W4287588076","doi":"https://doi.org/10.1109/icip46576.2022.9897699"},"language":"en","primary_location":{"id":"doi:10.1109/icip46576.2022.9897699","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip46576.2022.9897699","pdf_url":null,"source":{"id":"https://openalex.org/S4363607719","display_name":"2022 IEEE International Conference on Image Processing (ICIP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101634167","display_name":"Weijia Wu","orcid":"https://orcid.org/0000-0003-3912-7212"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weijia Wu","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041031140","display_name":"Enze Xie","orcid":"https://orcid.org/0000-0001-6890-1049"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Enze Xie","raw_affiliation_strings":["The University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The University of Hong Kong","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003608795","display_name":"Ruimao Zhang","orcid":"https://orcid.org/0000-0001-9511-7532"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruimao Zhang","raw_affiliation_strings":["The Chinese University of Hong Kong,Shenzhen,China","The Chinese University of Hong Kong, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong,Shenzhen,China","institution_ids":["https://openalex.org/I4210116924"]},{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101827340","display_name":"Wenhai Wang","orcid":"https://orcid.org/0000-0002-2418-3134"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenhai Wang","raw_affiliation_strings":["Shanghai Artificial Intelligence Laboratory,China","Shanghai Artificial Intelligence Laboratory, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory,China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]},{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100752686","display_name":"Ping Luo","orcid":"https://orcid.org/0000-0002-6685-7950"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Ping Luo","raw_affiliation_strings":["The University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The University of Hong Kong","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043169810","display_name":"Hong Zhou","orcid":"https://orcid.org/0000-0003-1314-8883"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Zhou","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101634167"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.2996,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.6264794,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1226","last_page":"1230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.8564635515213013},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.7796599864959717},{"id":"https://openalex.org/keywords/polygon","display_name":"Polygon (computer graphics)","score":0.7728325128555298},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7389549016952515},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7038592100143433},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6090500950813293},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43259188532829285},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.35492464900016785},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.11059144139289856}],"concepts":[{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.8564635515213013},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.7796599864959717},{"id":"https://openalex.org/C190694206","wikidata":"https://www.wikidata.org/wiki/Q3276654","display_name":"Polygon (computer graphics)","level":3,"score":0.7728325128555298},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7389549016952515},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7038592100143433},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6090500950813293},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43259188532829285},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35492464900016785},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.11059144139289856},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip46576.2022.9897699","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip46576.2022.9897699","pdf_url":null,"source":{"id":"https://openalex.org/S4363607719","display_name":"2022 IEEE International Conference on Image Processing (ICIP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1495267108","https://openalex.org/W1849277567","https://openalex.org/W1903029394","https://openalex.org/W1972065312","https://openalex.org/W2144554289","https://openalex.org/W2194775991","https://openalex.org/W2339589954","https://openalex.org/W2343052201","https://openalex.org/W2519818067","https://openalex.org/W2550687635","https://openalex.org/W2605982830","https://openalex.org/W2772800855","https://openalex.org/W2785383245","https://openalex.org/W2875814315","https://openalex.org/W2884585870","https://openalex.org/W2902494497","https://openalex.org/W2962804639","https://openalex.org/W2962810613","https://openalex.org/W2962935569","https://openalex.org/W2963299604","https://openalex.org/W2963647456","https://openalex.org/W2967615747","https://openalex.org/W2991626090","https://openalex.org/W2998621280","https://openalex.org/W3003921261","https://openalex.org/W3005400651","https://openalex.org/W3013262970","https://openalex.org/W6746206475","https://openalex.org/W6775038058"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"Unlike":[0],"existing":[1,24],"works":[2],"that":[3,76,96],"employ":[4],"fully-supervised":[5],"training":[6,133],"with":[7,33,65,105,135],"polygon":[8,115],"annotations,":[9,116,139],"this":[10],"study":[11],"proposes":[12],"an":[13,119],"unconstrained":[14],"text":[15,26],"detection":[16],"system":[17],"termed":[18],"Polygon-free":[19,99],"(PF),":[20],"in":[21],"which":[22],"most":[23],"polygon-based":[25],"detectors":[27],"(e.g.,":[28],"PSENet":[29,117],"[1])":[30],"are":[31],"trained":[32],"only":[34,106],"upright":[35,58,107,136],"bounding":[36,59,108,137],"box":[37,109,138],"annotations.":[38,110],"Our":[39],"core":[40],"idea":[41],"is":[42,62],"to":[43,49,52],"transfer":[44],"knowledge":[45],"from":[46],"synthetic":[47],"data":[48,51],"real":[50],"enhance":[53],"the":[54,97],"supervision":[55],"information":[56],"of":[57,126],"boxes.":[60],"This":[61],"made":[63],"possible":[64],"a":[66],"simple":[67],"segmentation":[68],"network,":[69],"namely":[70],"Skeleton":[71],"Attention":[72],"Segmentation":[73],"Network":[74],"(SASN),":[75],"includes":[77],"three":[78],"vital":[79],"components":[80],"(i.e.,":[81],"channel":[82],"attention,":[83],"spatial":[84],"attention":[85,88],"and":[86,90,140],"skeleton":[87],"map)":[89],"one":[91],"soft":[92],"cross-entropy":[93],"loss.Experiments":[94],"demonstrate":[95],"proposed":[98],"yields":[100],"surprisingly":[101],"high-quality":[102],"pixel-level":[103],"results":[104],"For":[111],"example,":[112],"without":[113],"using":[114],"achieves":[118],"80.5%":[120],"F-score":[121],"on":[122],"TotalText":[123],"(vs.":[124],"80.9%":[125],"fully":[127],"supervised":[128],"counterpart),":[129],"31.1%":[130],"better":[131],"than":[132],"directly":[134],"saves":[141],"80%+":[142],"labeling":[143],"costs.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
