{"id":"https://openalex.org/W4309969848","doi":"https://doi.org/10.1109/ictc55196.2022.9952873","title":"Improving Scene Text Recognition With A Combinative Image Augmentation Approach","display_name":"Improving Scene Text Recognition With A Combinative Image Augmentation Approach","publication_year":2022,"publication_date":"2022-10-19","ids":{"openalex":"https://openalex.org/W4309969848","doi":"https://doi.org/10.1109/ictc55196.2022.9952873"},"language":"en","primary_location":{"id":"doi:10.1109/ictc55196.2022.9952873","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ictc55196.2022.9952873","pdf_url":null,"source":{"id":"https://openalex.org/S4363607740","display_name":"2022 13th International Conference on Information and Communication Technology Convergence (ICTC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 13th International Conference on Information and Communication Technology Convergence (ICTC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000328387","display_name":"Ngan-Linh Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Ngan-Linh Nguyen","raw_affiliation_strings":["University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","Vietnam National University, Ho Chi Minh City, Vietnam","Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","institution_ids":[]},{"raw_affiliation_string":"Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]},{"raw_affiliation_string":"Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019114663","display_name":"Gia-Huy Lam","orcid":null},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Gia-Huy Lam","raw_affiliation_strings":["University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam","Vietnam National University, Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","institution_ids":[]},{"raw_affiliation_string":"Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam","institution_ids":[]},{"raw_affiliation_string":"Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077300267","display_name":"Hoang-Thong Vo","orcid":null},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Hoang-Thong Vo","raw_affiliation_strings":["University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","Vietnam National University, Ho Chi Minh City, Vietnam","Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","institution_ids":[]},{"raw_affiliation_string":"Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]},{"raw_affiliation_string":"Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012674107","display_name":"Trong-Hop Do","orcid":"https://orcid.org/0000-0001-5997-4983"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Trong-Hop Do","raw_affiliation_strings":["University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","Vietnam National University, Ho Chi Minh City, Vietnam","Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"University of Information Technology,Faculty of Information Science and Engineering,Ho Chi Minh City,Vietnam","institution_ids":[]},{"raw_affiliation_string":"Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]},{"raw_affiliation_string":"Faculty of Information Science and Engineering, University of Information Technology, Ho Chi Minh City, Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079575997","display_name":"Anh-Tien Tran","orcid":"https://orcid.org/0000-0003-4533-7451"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Anh-Tien Tran","raw_affiliation_strings":["School of Computer Science and Engineering, Chung-Ang University,Seoul,South Korea","School of Computer Science and Engineering, Chung-Ang University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Chung-Ang University,Seoul,South Korea","institution_ids":["https://openalex.org/I67900169"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Chung-Ang University, Seoul, South Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041978875","display_name":"Sungrae Cho","orcid":"https://orcid.org/0000-0003-1879-688X"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sungrae Cho","raw_affiliation_strings":["School of Computer Science and Engineering, Chung-Ang University,Seoul,South Korea","School of Computer Science and Engineering, Chung-Ang University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Chung-Ang University,Seoul,South Korea","institution_ids":["https://openalex.org/I67900169"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Chung-Ang University, Seoul, South Korea","institution_ids":["https://openalex.org/I67900169"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5000328387"],"corresponding_institution_ids":["https://openalex.org/I123565023"],"apc_list":null,"apc_paid":null,"fwci":0.06,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.29530871,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"abs 2106 6960","issue":null,"first_page":"1051","last_page":"1055"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8246526122093201},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6650652289390564},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.6519352793693542},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5635011196136475},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5597852468490601},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.49555718898773193},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.48762455582618713},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4681207239627838},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35434579849243164},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33795657753944397}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8246526122093201},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6650652289390564},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.6519352793693542},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5635011196136475},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5597852468490601},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.49555718898773193},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48762455582618713},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4681207239627838},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35434579849243164},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33795657753944397},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ictc55196.2022.9952873","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ictc55196.2022.9952873","pdf_url":null,"source":{"id":"https://openalex.org/S4363607740","display_name":"2022 13th International Conference on Information and Communication Technology Convergence (ICTC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 13th International Conference on Information and Communication Technology Convergence (ICTC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.6899999976158142,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1922126009","https://openalex.org/W1971822075","https://openalex.org/W1988461287","https://openalex.org/W2061802763","https://openalex.org/W2144554289","https://openalex.org/W2146835493","https://openalex.org/W2343052201","https://openalex.org/W2873558679","https://openalex.org/W2965066169","https://openalex.org/W2998382406","https://openalex.org/W3003336019","https://openalex.org/W3003642782","https://openalex.org/W3004846386","https://openalex.org/W3013262970","https://openalex.org/W3034414401","https://openalex.org/W3035449864","https://openalex.org/W3035682737","https://openalex.org/W3184557382","https://openalex.org/W3200351427","https://openalex.org/W3204479434","https://openalex.org/W3213619440","https://openalex.org/W3215143946","https://openalex.org/W4226329156","https://openalex.org/W6775038058"],"related_works":["https://openalex.org/W2519676117","https://openalex.org/W2218202131","https://openalex.org/W84108837","https://openalex.org/W2155740880","https://openalex.org/W2131713426","https://openalex.org/W4253249845","https://openalex.org/W2125452230","https://openalex.org/W2148444631","https://openalex.org/W1826068234","https://openalex.org/W2304716576"],"abstract_inverted_index":{"Scene":[0],"text":[1,43,85],"recognition":[2,66,86],"plays":[3],"an":[4,171,191],"important":[5],"role":[6],"in":[7,31,101,167,173],"various":[8],"intelligent":[9],"systems":[10,21],"today":[11],"such":[12],"as":[13],"robotic":[14],"process":[15],"automation":[16],"and":[17,54,74,94,145,169,181,199],"self-driving":[18],"cars.":[19],"These":[20],"require":[22],"knowledge":[23],"of":[24,37,49,62,91,142,193],"the":[25,29,32,47,59,63,65,80,89,99,102,136,140,154,164,174,185,188,196,202],"surrounding":[26],"scenery,":[27],"where":[28],"words":[30],"scene":[33,42,84],"hold":[34],"a":[35,92,116,150],"lot":[36],"valuable":[38],"information.":[39],"For":[40],"instance,":[41],"recognitions":[44],"can":[45],"serve":[46],"development":[48],"smart":[50,52],"tourism,":[51],"museums,":[53],"self-propelled":[55],"robots.":[56],"To":[57],"increase":[58,163],"practical":[60],"applicability":[61],"solution,":[64],"model":[67,175,198],"needs":[68],"to":[69,161],"meet":[70],"efficiently":[71],"both":[72,179],"accuracies":[73],"processing":[75],"time.":[76],"However,":[77],"before":[78],"constructing":[79],"model,":[81],"most":[82],"existing":[83],"frameworks":[87],"underrate":[88],"importance":[90],"reliable":[93],"well-served":[95],"augmentation":[96,109,118,123],"stage,":[97],"all":[98,157],"images":[100,168],"dataset":[103],"are":[104],"often":[105],"applied":[106],"with":[107],"common":[108],"functions.":[110],"In":[111,134],"this":[112],"paper,":[113],"we":[114],"present":[115],"combinative":[117],"framework":[119,137,186],"that":[120],"takes":[121],"random":[122],"functions":[124,143],"from":[125],"different":[126],"types":[127],"into":[128],"combinations":[129],"for":[130,149],"each":[131],"individual":[132],"image.":[133,155],"addition,":[135],"also":[138],"randomizes":[139],"number":[141],"taken":[144],"every":[146],"specific":[147],"parameter":[148],"particular":[151],"function":[152],"on":[153,178,195,201],"Thus,":[156],"these":[158],"tweaks":[159],"help":[160],"greatly":[162],"pattern":[165],"diversity":[166],"pose":[170],"improvement":[172],"evaluation.":[176],"Evaluated":[177],"seen":[180],"unseen":[182],"test":[183],"datasets,":[184],"increased":[187],"accuracy":[189],"by":[190],"average":[192],"5,02%":[194],"NRTR":[197],"2.36%":[200],"VietOCR":[203],"model.":[204]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
