{"id":"https://openalex.org/W4392903971","doi":"https://doi.org/10.1109/icassp48485.2024.10448354","title":"EK-Net:Real-Time Scene Text Detection with Expand Kernel Distance","display_name":"EK-Net:Real-Time Scene Text Detection with Expand Kernel Distance","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392903971","doi":"https://doi.org/10.1109/icassp48485.2024.10448354"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10448354","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10448354","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035265584","display_name":"Boyuan Zhu","orcid":"https://orcid.org/0000-0002-3822-059X"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Boyuan Zhu","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","School of Computer Science and Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005463262","display_name":"Fagui Liu","orcid":"https://orcid.org/0000-0003-1135-4982"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fagui Liu","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","Peng Cheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329980","display_name":"Xi Chen","orcid":"https://orcid.org/0000-0002-7790-9066"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xi Chen","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","School of Computer Science and Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107809180","display_name":"Quan Tang","orcid":"https://orcid.org/0009-0008-3075-4758"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quan Tang","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","School of Computer Science and Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5035265584"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":1.3121,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80057289,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"6380","last_page":"6384"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.7698675394058228},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7456585764884949},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.5946747064590454},{"id":"https://openalex.org/keywords/curvature","display_name":"Curvature","score":0.5829506516456604},{"id":"https://openalex.org/keywords/net","display_name":"Net (polyhedron)","score":0.5794803500175476},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5684120655059814},{"id":"https://openalex.org/keywords/clipping","display_name":"Clipping (morphology)","score":0.544161319732666},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37922751903533936},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.36204513907432556},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3278994560241699},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.18503957986831665},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18425479531288147},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.07998979091644287}],"concepts":[{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.7698675394058228},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7456585764884949},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.5946747064590454},{"id":"https://openalex.org/C195065555","wikidata":"https://www.wikidata.org/wiki/Q214881","display_name":"Curvature","level":2,"score":0.5829506516456604},{"id":"https://openalex.org/C14166107","wikidata":"https://www.wikidata.org/wiki/Q253829","display_name":"Net (polyhedron)","level":2,"score":0.5794803500175476},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5684120655059814},{"id":"https://openalex.org/C2776848632","wikidata":"https://www.wikidata.org/wiki/Q853463","display_name":"Clipping (morphology)","level":2,"score":0.544161319732666},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37922751903533936},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.36204513907432556},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3278994560241699},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.18503957986831665},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18425479531288147},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.07998979091644287},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10448354","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10448354","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1922126009","https://openalex.org/W2074849287","https://openalex.org/W2144554289","https://openalex.org/W2193145675","https://openalex.org/W2302255633","https://openalex.org/W2507296351","https://openalex.org/W2550687635","https://openalex.org/W2604243686","https://openalex.org/W2784050770","https://openalex.org/W2899996070","https://openalex.org/W2914492226","https://openalex.org/W2963150697","https://openalex.org/W2963398399","https://openalex.org/W2991626090","https://openalex.org/W2998621280","https://openalex.org/W3102695566","https://openalex.org/W3106250896","https://openalex.org/W3132296545","https://openalex.org/W3159307593","https://openalex.org/W3160791979","https://openalex.org/W3172799005","https://openalex.org/W3181016597","https://openalex.org/W3204222996","https://openalex.org/W3208795278","https://openalex.org/W4214922754","https://openalex.org/W4286696412","https://openalex.org/W6752534923","https://openalex.org/W6802541184"],"related_works":["https://openalex.org/W2035130982","https://openalex.org/W4255837520","https://openalex.org/W2912321008","https://openalex.org/W2387011115","https://openalex.org/W1998607122","https://openalex.org/W55883722","https://openalex.org/W3198205105","https://openalex.org/W2956000802","https://openalex.org/W3198227724","https://openalex.org/W110878719"],"abstract_inverted_index":{"Recently,":[0],"scene":[1],"text":[2,76],"detection":[3,15,29],"has":[4],"received":[5],"significant":[6],"attention":[7],"due":[8],"to":[9,40,63,95,105,140],"its":[10],"wide":[11],"application.":[12],"However,":[13],"accurate":[14],"in":[16,66],"complex":[17],"scenes":[18],"of":[19,44,117,146,155],"multiple":[20],"scales,":[21],"orientations,":[22],"and":[23,127],"curvature":[24],"remains":[25],"a":[26,64,83,123],"challenge.":[27],"Numerous":[28],"methods":[30],"adopt":[31],"the":[32,42,57,75,98,114],"Vatti":[33],"clipping":[34],"(VC)":[35],"algorithm":[36],"for":[37,97],"multiple-instance":[38],"training":[39],"address":[41],"issue":[43],"arbitrary-shaped":[45,118],"text.":[46],"Yet":[47],"we":[48,81],"identify":[49],"several":[50],"bias":[51],"results":[52,130],"from":[53,69],"these":[54],"approaches":[55],"called":[56],"\"shrinked":[58],"kernel\".":[59],"Specifically,":[60],"it":[61],"refers":[62],"decrease":[65],"accuracy":[67],"resulting":[68],"an":[70],"output":[71],"that":[72,132],"overly":[73],"favors":[74],"kernel.":[77],"In":[78],"this":[79],"paper,":[80],"propose":[82],"new":[84],"approach":[85],"named":[86],"Expand":[87],"Kernel":[88],"Network":[89],"(EK-Net)":[90],"with":[91],"expand":[92],"kernel":[93],"distance":[94],"compensate":[96],"previous":[99],"deficiency,":[100],"which":[101],"includes":[102],"three-stages":[103],"regression":[104],"complete":[106],"instance":[107],"detection.":[108],"Moreover,":[109],"EK-Net":[110,133],"not":[111],"only":[112],"realize":[113],"precise":[115],"positioning":[116],"text,":[119],"but":[120],"also":[121],"achieve":[122],"trade-off":[124],"between":[125],"performance":[126,138],"speed.":[128],"Evaluation":[129],"demonstrate":[131],"achieves":[134],"state-of-the-art":[135],"or":[136],"competitive":[137],"compared":[139],"other":[141],"advanced":[142],"methods,":[143],"e.g.,":[144],"F-measure":[145,154],"85.72%":[147],"at":[148,157],"35.42":[149],"FPS":[150,159],"on":[151,160],"ICDAR":[152],"2015,":[153],"85.75%":[156],"40.13":[158],"CTW1500.":[161]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
