{"id":"https://openalex.org/W4382562143","doi":"https://doi.org/10.23919/mipro57284.2023.10159700","title":"An Overview of State-of-the-art Solutions for Scene Text Detection","display_name":"An Overview of State-of-the-art Solutions for Scene Text Detection","publication_year":2023,"publication_date":"2023-05-22","ids":{"openalex":"https://openalex.org/W4382562143","doi":"https://doi.org/10.23919/mipro57284.2023.10159700"},"language":"en","primary_location":{"id":"doi:10.23919/mipro57284.2023.10159700","is_oa":false,"landing_page_url":"http://dx.doi.org/10.23919/mipro57284.2023.10159700","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 46th MIPRO ICT and Electronics Convention (MIPRO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109618725","display_name":"Mladen D\u017eida","orcid":null},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":true,"raw_author_name":"Mladen D\u017eida","raw_affiliation_strings":["University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia"],"affiliations":[{"raw_affiliation_string":"University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","institution_ids":["https://openalex.org/I181343428"]},{"raw_affiliation_string":"Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062965196","display_name":"Davor Vukadin","orcid":"https://orcid.org/0000-0003-3309-6718"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Davor Vukadin","raw_affiliation_strings":["University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia"],"affiliations":[{"raw_affiliation_string":"University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","institution_ids":["https://openalex.org/I181343428"]},{"raw_affiliation_string":"Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052566827","display_name":"Marin \u0160ili\u0107","orcid":"https://orcid.org/0000-0002-4896-7689"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Marin \u0160ili\u0107","raw_affiliation_strings":["University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia"],"affiliations":[{"raw_affiliation_string":"University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","institution_ids":["https://openalex.org/I181343428"]},{"raw_affiliation_string":"Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062293489","display_name":"Goran Dela\u010d","orcid":"https://orcid.org/0000-0001-5315-8387"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Goran Dela\u010d","raw_affiliation_strings":["University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia"],"affiliations":[{"raw_affiliation_string":"University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","institution_ids":["https://openalex.org/I181343428"]},{"raw_affiliation_string":"Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024279611","display_name":"Klemo Vladimir","orcid":"https://orcid.org/0000-0002-6764-8851"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Klemo Vladimir","raw_affiliation_strings":["University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia"],"affiliations":[{"raw_affiliation_string":"University of Zagreb,Faculty of Electrical Engineering and Computing,Zagreb,Croatia","institution_ids":["https://openalex.org/I181343428"]},{"raw_affiliation_string":"Faculty of Electrical Engineering and Computing, University of Zagreb, Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5109618725"],"corresponding_institution_ids":["https://openalex.org/I181343428"],"apc_list":null,"apc_paid":null,"fwci":0.2456,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.50668681,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"947","last_page":"952"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7838989496231079},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7524977922439575},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.6907422542572021},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6681205034255981},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6671434044837952},{"id":"https://openalex.org/keywords/text-detection","display_name":"Text detection","score":0.6207224130630493},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5638719201087952},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4854012429714203},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4634646475315094},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.45360904932022095},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.45269566774368286},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4451966881752014},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4320793151855469},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.4121493101119995},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4104350209236145},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.36251312494277954},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3475834131240845},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3332933783531189},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10793182253837585}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7838989496231079},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7524977922439575},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.6907422542572021},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6681205034255981},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6671434044837952},{"id":"https://openalex.org/C2983589003","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text detection","level":3,"score":0.6207224130630493},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5638719201087952},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4854012429714203},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4634646475315094},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.45360904932022095},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.45269566774368286},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4451966881752014},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4320793151855469},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.4121493101119995},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4104350209236145},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36251312494277954},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3475834131240845},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3332933783531189},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10793182253837585},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/mipro57284.2023.10159700","is_oa":false,"landing_page_url":"http://dx.doi.org/10.23919/mipro57284.2023.10159700","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 46th MIPRO ICT and Electronics Convention (MIPRO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2144554289","https://openalex.org/W2339589954","https://openalex.org/W2464918637","https://openalex.org/W2519818067","https://openalex.org/W2550687635","https://openalex.org/W2604735854","https://openalex.org/W2605076167","https://openalex.org/W2725486421","https://openalex.org/W2784050770","https://openalex.org/W2810028092","https://openalex.org/W2902494497","https://openalex.org/W2922690896","https://openalex.org/W2962804639","https://openalex.org/W2962810613","https://openalex.org/W2963647456","https://openalex.org/W2963840241","https://openalex.org/W2963977642","https://openalex.org/W2964294787","https://openalex.org/W2965512000","https://openalex.org/W2991626090","https://openalex.org/W2998621280","https://openalex.org/W3035222584","https://openalex.org/W3082397598","https://openalex.org/W3102695566","https://openalex.org/W3154615938","https://openalex.org/W4292962408","https://openalex.org/W4299729124","https://openalex.org/W6719590338","https://openalex.org/W6739844568","https://openalex.org/W6760673939"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"Scene":[0],"text":[1,8,73,75,81,97],"detection":[2,98],"is":[3,53],"a":[4,17,23,105],"task":[5,69],"of":[6,25,37,49,61,92],"identifying":[7],"regions":[9],"and":[10,28,43,83,116],"labeling":[11],"them":[12],"with":[13,111],"bounding":[14],"boxes":[15],"in":[16],"complex":[18,57,78],"background.":[19],"It":[20],"has":[21,29],"received":[22],"lot":[24],"attention":[26],"recently":[27],"become":[30],"far":[31],"from":[32],"unsolvable":[33],"due":[34,45],"to":[35,46,55,113],"progress":[36],"deep":[38],"learning":[39],"for":[40,95],"computer":[41,50],"vision":[42],"also":[44],"rapid":[47],"development":[48],"hardware":[51],"which":[52],"able":[54],"process":[56],"neural":[58],"networks.":[59],"Some":[60],"the":[62],"most":[63],"common":[64],"challenges":[65],"that":[66],"make":[67],"this":[68],"difficult":[70],"are":[71],"irregular":[72],"shapes,":[74],"interferences,":[76],"very":[77],"background,":[79],"different":[80],"sizes":[82],"low":[84],"image":[85],"quality.":[86],"This":[87],"paper":[88],"presents":[89],"an":[90],"overview":[91],"state-of-the-art":[93],"solutions":[94,110],"scene":[96],"where":[99],"ICDAR":[100],"2015":[101],"was":[102],"used":[103],"as":[104],"benchmark":[106],"dataset.":[107],"We":[108],"compare":[109],"respect":[112],"precision,":[114],"recall":[115],"F-score.":[117]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
