{"id":"https://openalex.org/W4221097663","doi":"https://doi.org/10.1109/tnnls.2022.3152596","title":"Kernel Proposal Network for Arbitrary Shape Text Detection","display_name":"Kernel Proposal Network for Arbitrary Shape Text Detection","publication_year":2022,"publication_date":"2022-03-10","ids":{"openalex":"https://openalex.org/W4221097663","doi":"https://doi.org/10.1109/tnnls.2022.3152596","pmid":"https://pubmed.ncbi.nlm.nih.gov/35271451"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2022.3152596","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3152596","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075041497","display_name":"Shi-Xue Zhang","orcid":"https://orcid.org/0000-0001-7030-1974"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shi-Xue Zhang","raw_affiliation_strings":["School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7030-1974","affiliations":[{"raw_affiliation_string":"School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078514263","display_name":"Xiaobin Zhu","orcid":"https://orcid.org/0000-0003-2702-4136"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaobin Zhu","raw_affiliation_strings":["School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2702-4136","affiliations":[{"raw_affiliation_string":"School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090213090","display_name":"Jie-Bo Hou","orcid":"https://orcid.org/0000-0002-4632-0160"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie-Bo Hou","raw_affiliation_strings":["School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-4632-0160","affiliations":[{"raw_affiliation_string":"School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101456900","display_name":"Chun Yang","orcid":"https://orcid.org/0000-0001-5262-3048"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chun Yang","raw_affiliation_strings":["School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074514262","display_name":"Xu-Cheng Yin","orcid":"https://orcid.org/0000-0003-0023-0220"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu-Cheng Yin","raw_affiliation_strings":["School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0023-0220","affiliations":[{"raw_affiliation_string":"School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5075041497"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":3.5714,"has_fulltext":false,"cited_by_count":37,"citation_normalized_percentile":{"value":0.94155797,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"34","issue":"11","first_page":"8731","last_page":"8742"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6786302328109741},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.675980806350708},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.671817421913147},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5655909776687622},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5004632472991943},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.49612435698509216},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4846268594264984},{"id":"https://openalex.org/keywords/kernel-method","display_name":"Kernel method","score":0.4549304246902466},{"id":"https://openalex.org/keywords/graph-kernel","display_name":"Graph kernel","score":0.4224071502685547},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3991564214229584},{"id":"https://openalex.org/keywords/kernel-embedding-of-distributions","display_name":"Kernel embedding of distributions","score":0.2281987965106964},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1800190806388855},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.09707766771316528},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.0849587619304657}],"concepts":[{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6786302328109741},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.675980806350708},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.671817421913147},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5655909776687622},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5004632472991943},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.49612435698509216},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4846268594264984},{"id":"https://openalex.org/C122280245","wikidata":"https://www.wikidata.org/wiki/Q620622","display_name":"Kernel method","level":3,"score":0.4549304246902466},{"id":"https://openalex.org/C100595998","wikidata":"https://www.wikidata.org/wiki/Q11731931","display_name":"Graph kernel","level":5,"score":0.4224071502685547},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3991564214229584},{"id":"https://openalex.org/C134517425","wikidata":"https://www.wikidata.org/wiki/Q16000131","display_name":"Kernel embedding of distributions","level":4,"score":0.2281987965106964},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1800190806388855},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.09707766771316528},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.0849587619304657},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2022.3152596","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3152596","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:35271451","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35271451","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G2141617675","display_name":null,"funder_award_id":"62076024","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2379300237","display_name":null,"funder_award_id":"2020AAA09701","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2903026367","display_name":null,"funder_award_id":"62172035","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G356227064","display_name":null,"funder_award_id":"62006018","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4738090328","display_name":null,"funder_award_id":"61806017","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8772010899","display_name":null,"funder_award_id":"62125601","funder_id":"https://openalex.org/F4320336125","funder_display_name":"National Science Fund for Distinguished Young Scholars"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320336125","display_name":"National Science Fund for Distinguished Young Scholars","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1522301498","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W2074849287","https://openalex.org/W2144554289","https://openalex.org/W2194775991","https://openalex.org/W2504335775","https://openalex.org/W2519818067","https://openalex.org/W2550687635","https://openalex.org/W2565639579","https://openalex.org/W2593539516","https://openalex.org/W2604735854","https://openalex.org/W2605076167","https://openalex.org/W2605982830","https://openalex.org/W2766895242","https://openalex.org/W2772800855","https://openalex.org/W2784050770","https://openalex.org/W2785383245","https://openalex.org/W2810028092","https://openalex.org/W2884131745","https://openalex.org/W2902494497","https://openalex.org/W2914492226","https://openalex.org/W2953606406","https://openalex.org/W2953894958","https://openalex.org/W2962770929","https://openalex.org/W2962810613","https://openalex.org/W2962914239","https://openalex.org/W2963150697","https://openalex.org/W2963161243","https://openalex.org/W2963187132","https://openalex.org/W2963195262","https://openalex.org/W2963299604","https://openalex.org/W2963351448","https://openalex.org/W2963353821","https://openalex.org/W2963516811","https://openalex.org/W2963623257","https://openalex.org/W2963647456","https://openalex.org/W2964018263","https://openalex.org/W2964685115","https://openalex.org/W2967591398","https://openalex.org/W2967615747","https://openalex.org/W2968226676","https://openalex.org/W2982770724","https://openalex.org/W2988098900","https://openalex.org/W2989604896","https://openalex.org/W2991405684","https://openalex.org/W2991626090","https://openalex.org/W2998621280","https://openalex.org/W3012573144","https://openalex.org/W3034514377","https://openalex.org/W3034792612","https://openalex.org/W3035679705","https://openalex.org/W3043531819","https://openalex.org/W3093046205","https://openalex.org/W3093600664","https://openalex.org/W3102695566","https://openalex.org/W3106228955","https://openalex.org/W3106546328","https://openalex.org/W3110398855","https://openalex.org/W3118957360","https://openalex.org/W3124566001","https://openalex.org/W3172799005","https://openalex.org/W3181016597","https://openalex.org/W3184364189","https://openalex.org/W6631190155","https://openalex.org/W6753441378","https://openalex.org/W6784930956"],"related_works":["https://openalex.org/W2089892314","https://openalex.org/W1603091392","https://openalex.org/W2574115973","https://openalex.org/W2179275589","https://openalex.org/W1983263273","https://openalex.org/W2121506664","https://openalex.org/W2189183545","https://openalex.org/W1558903433","https://openalex.org/W2974741803","https://openalex.org/W2093878082"],"abstract_inverted_index":{"Segmentation-based":[0],"methods":[1],"have":[2],"achieved":[3],"great":[4],"success":[5],"for":[6,45,91,166],"arbitrary":[7,46,75],"shape":[8,47,76],"text":[9,14,48,56,77,93,172,183,220,223],"detection.":[10,49,224],"However,":[11],"separating":[12],"neighboring":[13,55,182,219],"instances":[15,57,184,221],"is":[16,200],"still":[17],"one":[18],"of":[19,28,103,171,195,218,236],"the":[20,26,68,112,124,187,193,201,205,215,231],"most":[21],"challenging":[22,228],"problems":[23],"due":[24],"to":[25,99,117,203,210],"complexity":[27],"texts":[29,61],"in":[30,73,222],"scene":[31],"images.":[32],"In":[33,174],"this":[34,175],"article,":[35],"we":[36,129],"propose":[37,130],"an":[38],"innovative":[39],"kernel":[40,105,127,142,157,208],"proposal":[41],"network":[42,149],"(dubbed":[43],"KPN)":[44],"The":[50,239],"proposed":[51],"KPN":[52,84,178],"can":[53,179],"separate":[54,181],"by":[58,148,153],"classifying":[59],"different":[60],"into":[62],"instance-independent":[63],"feature":[64,114,164],"maps,":[65],"meanwhile":[66],"avoiding":[67],"complex":[69],"aggregation":[70],"process":[71],"existing":[72],"segmentation-based":[74],"detection":[78],"methods.":[79],"To":[80,122,192],"be":[81,97],"concrete,":[82],"our":[83,141,177,196,198,237],"will":[85,96,159],"predict":[86],"a":[87,101,131],"Gaussian":[88],"center":[89],"map":[90],"each":[92],"image,":[94],"which":[95],"used":[98],"extract":[100],"series":[102],"candidate":[104],"proposals":[106,143,158],"(i.e.,":[107],"dynamic":[108,206],"convolution":[109,207],"kernel)":[110],"from":[111],"embedding":[113,163],"maps":[115,165,170],"according":[116],"their":[118],"corresponding":[119],"keypoint":[120],"positions.":[121],"enforce":[123],"independence":[125],"between":[126],"proposals,":[128],"novel":[132],"orthogonal":[133,138],"learning":[134],"loss":[135],"(OLL)":[136],"via":[137],"constraints.":[139],"Specifically,":[140],"contain":[144],"important":[145],"self-information":[146],"learned":[147],"and":[150,185,212,234,241],"location":[151],"information":[152],"position":[154],"embedding.":[155],"Finally,":[156],"individually":[160],"convolve":[161],"all":[162],"generating":[167],"individual":[168],"embedded":[169],"instances.":[173],"way,":[176],"effectively":[180,213],"improve":[186],"robustness":[188],"against":[189],"unclear":[190],"boundaries.":[191],"best":[194],"knowledge,":[197],"work":[199],"first":[202],"introduce":[204],"strategy":[209],"efficiently":[211],"tackle":[214],"adhesion":[216],"problem":[217],"Experimental":[225],"results":[226],"on":[227],"datasets":[229],"verify":[230],"impressive":[232],"performance":[233],"efficiency":[235],"method.":[238],"code":[240],"model":[242],"are":[243],"available":[244],"at":[245],"https://github.com/GXYM/KPN.":[246]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":20},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
