{"id":"https://openalex.org/W4310113663","doi":"https://doi.org/10.1145/3568562.3568624","title":"Improving text recognition by combining visual and linguistic features of text","display_name":"Improving text recognition by combining visual and linguistic features of text","publication_year":2022,"publication_date":"2022-11-29","ids":{"openalex":"https://openalex.org/W4310113663","doi":"https://doi.org/10.1145/3568562.3568624"},"language":"en","primary_location":{"id":"doi:10.1145/3568562.3568624","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3568562.3568624","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 11th International Symposium on Information and Communication Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067894717","display_name":"Cong Tran","orcid":"https://orcid.org/0000-0001-9467-4978"},"institutions":[{"id":"https://openalex.org/I4210095603","display_name":"Vietnam Posts and Telecommunications Group (Vietnam)","ror":"https://ror.org/00q0e7f94","country_code":"VN","type":"company","lineage":["https://openalex.org/I4210095603"]},{"id":"https://openalex.org/I4400600977","display_name":"Posts and Telecommunications Institute of Technology","ror":"https://ror.org/0363rtq22","country_code":null,"type":"education","lineage":["https://openalex.org/I4400600977"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Cong Tran","raw_affiliation_strings":["Posts and Telecommunications Institute of Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0001-9467-4978","affiliations":[{"raw_affiliation_string":"Posts and Telecommunications Institute of Technology, Viet Nam","institution_ids":["https://openalex.org/I4210095603","https://openalex.org/I4400600977"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014920897","display_name":"Khanh Nguyen-Trong","orcid":"https://orcid.org/0000-0001-5175-8805"},"institutions":[{"id":"https://openalex.org/I4210095603","display_name":"Vietnam Posts and Telecommunications Group (Vietnam)","ror":"https://ror.org/00q0e7f94","country_code":"VN","type":"company","lineage":["https://openalex.org/I4210095603"]},{"id":"https://openalex.org/I4400600977","display_name":"Posts and Telecommunications Institute of Technology","ror":"https://ror.org/0363rtq22","country_code":null,"type":"education","lineage":["https://openalex.org/I4400600977"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Khanh Nguyen-Trong","raw_affiliation_strings":["Posts and Telecommunications Institute of Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0001-5175-8805","affiliations":[{"raw_affiliation_string":"Posts and Telecommunications Institute of Technology, Viet Nam","institution_ids":["https://openalex.org/I4210095603","https://openalex.org/I4400600977"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062890024","display_name":"Cuong Pham","orcid":"https://orcid.org/0000-0003-0973-0889"},"institutions":[{"id":"https://openalex.org/I4210095603","display_name":"Vietnam Posts and Telecommunications Group (Vietnam)","ror":"https://ror.org/00q0e7f94","country_code":"VN","type":"company","lineage":["https://openalex.org/I4210095603"]},{"id":"https://openalex.org/I4400600977","display_name":"Posts and Telecommunications Institute of Technology","ror":"https://ror.org/0363rtq22","country_code":null,"type":"education","lineage":["https://openalex.org/I4400600977"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Cuong Pham","raw_affiliation_strings":["Posts and Telecommunications Institute of Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0003-0973-0889","affiliations":[{"raw_affiliation_string":"Posts and Telecommunications Institute of Technology, Viet Nam","institution_ids":["https://openalex.org/I4210095603","https://openalex.org/I4400600977"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049746327","display_name":"Dat Tran-Anh","orcid":"https://orcid.org/0000-0002-8924-4356"},"institutions":[{"id":"https://openalex.org/I4210095603","display_name":"Vietnam Posts and Telecommunications Group (Vietnam)","ror":"https://ror.org/00q0e7f94","country_code":"VN","type":"company","lineage":["https://openalex.org/I4210095603"]},{"id":"https://openalex.org/I4400600977","display_name":"Posts and Telecommunications Institute of Technology","ror":"https://ror.org/0363rtq22","country_code":null,"type":"education","lineage":["https://openalex.org/I4400600977"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Dat Tran-Anh","raw_affiliation_strings":["Posts and Telecommunications Institute of Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0002-8924-4356","affiliations":[{"raw_affiliation_string":"Posts and Telecommunications Institute of Technology, Viet Nam","institution_ids":["https://openalex.org/I4210095603","https://openalex.org/I4400600977"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061365021","display_name":"Tien Nguyen-Thi-Tan","orcid":"https://orcid.org/0000-0002-6300-336X"},"institutions":[{"id":"https://openalex.org/I4210115718","display_name":"Thai Nguyen University","ror":"https://ror.org/02128gy91","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210115718"]},{"id":"https://openalex.org/I4401726905","display_name":"Thai Nguyen University of Medicine and Pharmacy","ror":"https://ror.org/053jkh992","country_code":null,"type":"education","lineage":["https://openalex.org/I4401726905"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Tien Nguyen-Thi-Tan","raw_affiliation_strings":["Thai Nguyen University of Medicine and Pharmacy, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0002-6300-336X","affiliations":[{"raw_affiliation_string":"Thai Nguyen University of Medicine and Pharmacy, Viet Nam","institution_ids":["https://openalex.org/I4210115718","https://openalex.org/I4401726905"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5067894717"],"corresponding_institution_ids":["https://openalex.org/I4210095603","https://openalex.org/I4400600977"],"apc_list":null,"apc_paid":null,"fwci":0.2041,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.49567028,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"39","issue":null,"first_page":"329","last_page":"335"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9728000164031982,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8114562034606934},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.7860013842582703},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.7179533243179321},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7022064924240112},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6793097853660583},{"id":"https://openalex.org/keywords/vietnamese","display_name":"Vietnamese","score":0.6417780518531799},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.540073812007904},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5084030032157898},{"id":"https://openalex.org/keywords/text-recognition","display_name":"Text recognition","score":0.47582271695137024},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.4549621045589447},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.42335301637649536},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3685639500617981},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2951527535915375},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.17647665739059448}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8114562034606934},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.7860013842582703},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.7179533243179321},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7022064924240112},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6793097853660583},{"id":"https://openalex.org/C103621254","wikidata":"https://www.wikidata.org/wiki/Q9199","display_name":"Vietnamese","level":2,"score":0.6417780518531799},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.540073812007904},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5084030032157898},{"id":"https://openalex.org/C2983812711","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text recognition","level":3,"score":0.47582271695137024},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.4549621045589447},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.42335301637649536},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3685639500617981},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2951527535915375},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.17647665739059448},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3568562.3568624","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3568562.3568624","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 11th International Symposium on Information and Communication Technology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8500000238418579,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W654550266","https://openalex.org/W2519818067","https://openalex.org/W2583381660","https://openalex.org/W2766343341","https://openalex.org/W2809468489","https://openalex.org/W2905096748","https://openalex.org/W2996221890","https://openalex.org/W2997154779","https://openalex.org/W3104953317","https://openalex.org/W3108280614","https://openalex.org/W3124381626","https://openalex.org/W3130456057","https://openalex.org/W3158057761","https://openalex.org/W3163650427","https://openalex.org/W3182680257","https://openalex.org/W3186819370","https://openalex.org/W3197877599","https://openalex.org/W4205269010","https://openalex.org/W4206353077","https://openalex.org/W4226396278","https://openalex.org/W4293558655","https://openalex.org/W4320148024"],"related_works":["https://openalex.org/W1991513203","https://openalex.org/W3178467699","https://openalex.org/W4306707571","https://openalex.org/W3179897446","https://openalex.org/W4309224528","https://openalex.org/W2970150031","https://openalex.org/W3211896491","https://openalex.org/W3153225109","https://openalex.org/W3163712264","https://openalex.org/W4362605793"],"abstract_inverted_index":{"While":[0],"being":[1],"studied":[2],"for":[3,45,53,111],"several":[4],"decades,":[5],"Optical":[6],"Character":[7],"Recognition":[8],"(OCR)":[9],"has":[10,47],"still":[11],"been":[12,49],"attracting":[13],"considerable":[14],"attention":[15],"from":[16],"researchers.":[17],"Previous":[18],"studies":[19],"tend":[20],"to":[21,35,62,106,129],"focus":[22],"on":[23,136],"visual":[24,72,113],"features":[25,75],"of":[26,66,76,84,115,149,155],"optical":[27,78],"texts,":[28],"such":[29],"as":[30],"texture,":[31],"shape,":[32],"and":[33,73,89,103,151],"color":[34],"build":[36],"OCR":[37,68,127],"models.":[38],"However,":[39],"linguistic":[40,74],"features,":[41],"an":[42,147],"important":[43],"factor":[44],"OCR,":[46],"not":[48],"extensively":[50],"investigated,":[51],"especially":[52],"Vietnamese-OCR":[54],"scanned":[55],"documents.":[56],"Therefore,":[57],"we":[58],"introduce":[59],"a":[60,86,91,137,152],"method":[61,82,120,145],"improve":[63],"the":[64,77,101,108,112,116,143],"performance":[65],"Vietnamese":[67],"by":[69],"combining":[70],"both":[71],"text.":[79,117],"The":[80],"proposed":[81,144],"consists":[83],"(i)":[85],"domain-specific":[87],"dictionary":[88],"(ii)":[90],"modified":[92],"natural":[93],"language":[94],"processing":[95],"model":[96],"termed":[97],"ABCNet,":[98],"employed":[99],"at":[100],"training":[102],"inference":[104],"step,":[105],"determine":[107],"best":[109],"candidate":[110],"appearance":[114],"Moreover,":[118],"our":[119],"can":[121],"easily":[122],"be":[123],"integrated":[124],"with":[125],"existing":[126],"methods":[128],"further":[130],"increase":[131],"their":[132],"performance.":[133],"Experimental":[134],"results":[135],"newly":[138],"collected":[139],"dataset":[140],"show":[141],"that":[142],"achieves":[146],"accuracy":[148],"83.61%":[150],"F1":[153],"score":[154],"84.1%.":[156]},"counts_by_year":[{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
