{"id":"https://openalex.org/W2061088043","doi":"https://doi.org/10.1109/nlpke.2010.5587781","title":"Realization of a high performance bilingual OCR system for Thai-English printed documents","display_name":"Realization of a high performance bilingual OCR system for Thai-English printed documents","publication_year":2010,"publication_date":"2010-08-01","ids":{"openalex":"https://openalex.org/W2061088043","doi":"https://doi.org/10.1109/nlpke.2010.5587781","mag":"2061088043"},"language":"en","primary_location":{"id":"doi:10.1109/nlpke.2010.5587781","is_oa":false,"landing_page_url":"https://doi.org/10.1109/nlpke.2010.5587781","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th International Conference on Natural Language Processing and Knowledge Engineering(NLPKE-2010)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066276856","display_name":"Supachai Tangwongsan","orcid":null},"institutions":[{"id":"https://openalex.org/I25399158","display_name":"Mahidol University","ror":"https://ror.org/01znkr924","country_code":"TH","type":"education","lineage":["https://openalex.org/I25399158"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Supachai Tangwongsan","raw_affiliation_strings":["Faculty of Information and Communication Technology, Mahidol University, Bangkok, Thailand","Faculty of Information and Communication Technology, Mahidol University, Bangkok Thailand"],"affiliations":[{"raw_affiliation_string":"Faculty of Information and Communication Technology, Mahidol University, Bangkok, Thailand","institution_ids":["https://openalex.org/I25399158"]},{"raw_affiliation_string":"Faculty of Information and Communication Technology, Mahidol University, Bangkok Thailand","institution_ids":["https://openalex.org/I25399158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053833953","display_name":"Buntida Suvacharakulton","orcid":null},"institutions":[{"id":"https://openalex.org/I25399158","display_name":"Mahidol University","ror":"https://ror.org/01znkr924","country_code":"TH","type":"education","lineage":["https://openalex.org/I25399158"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Buntida Suvacharakulton","raw_affiliation_strings":["Faculty of Information and Communication Technology, Mahidol University, Bangkok, Thailand","Faculty of Information and Communication Technology, Mahidol University, Bangkok Thailand"],"affiliations":[{"raw_affiliation_string":"Faculty of Information and Communication Technology, Mahidol University, Bangkok, Thailand","institution_ids":["https://openalex.org/I25399158"]},{"raw_affiliation_string":"Faculty of Information and Communication Technology, Mahidol University, Bangkok Thailand","institution_ids":["https://openalex.org/I25399158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5066276856"],"corresponding_institution_ids":["https://openalex.org/I25399158"],"apc_list":null,"apc_paid":null,"fwci":0.3187,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.60025442,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8128328323364258},{"id":"https://openalex.org/keywords/extractor","display_name":"Extractor","score":0.7472234964370728},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6008067727088928},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6005370616912842},{"id":"https://openalex.org/keywords/realization","display_name":"Realization (probability)","score":0.5663387179374695},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5253649950027466},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.47216957807540894},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.45451802015304565},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3885115385055542},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3495251536369324},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.16388210654258728},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08087235689163208},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07455241680145264}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8128328323364258},{"id":"https://openalex.org/C117978034","wikidata":"https://www.wikidata.org/wiki/Q5422192","display_name":"Extractor","level":2,"score":0.7472234964370728},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6008067727088928},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6005370616912842},{"id":"https://openalex.org/C2781089630","wikidata":"https://www.wikidata.org/wiki/Q21856745","display_name":"Realization (probability)","level":2,"score":0.5663387179374695},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5253649950027466},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.47216957807540894},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.45451802015304565},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3885115385055542},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3495251536369324},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.16388210654258728},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08087235689163208},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07455241680145264},{"id":"https://openalex.org/C21880701","wikidata":"https://www.wikidata.org/wiki/Q2144042","display_name":"Process engineering","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/nlpke.2010.5587781","is_oa":false,"landing_page_url":"https://doi.org/10.1109/nlpke.2010.5587781","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th International Conference on Natural Language Processing and Knowledge Engineering(NLPKE-2010)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.800000011920929}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1979012001","https://openalex.org/W2110909944","https://openalex.org/W2119076929","https://openalex.org/W2120854963","https://openalex.org/W2126109012","https://openalex.org/W2130650159","https://openalex.org/W2133926179","https://openalex.org/W2142553359","https://openalex.org/W2171411755","https://openalex.org/W2285084126","https://openalex.org/W4285719527","https://openalex.org/W6679881841","https://openalex.org/W6685096043","https://openalex.org/W6695715505"],"related_works":["https://openalex.org/W2022544890","https://openalex.org/W2394097730","https://openalex.org/W1979583797","https://openalex.org/W2953302367","https://openalex.org/W2945706271","https://openalex.org/W4387435415","https://openalex.org/W2114169842","https://openalex.org/W2535808783","https://openalex.org/W3183408266","https://openalex.org/W1941834444"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,56,60,95,134,180,187],"high":[4],"performance":[5],"bilingual":[6,170,196],"OCR":[7],"system":[8,130,153,184],"for":[9,39,120],"printed":[10,139],"Thai":[11,21,161],"and":[12,22,59,72,144,167],"English":[13,23,165],"text.":[14],"With":[15],"the":[16,25,45,52,63,66,77,86,91,107,129,148,152,173,176,183],"complex":[17],"nature":[18],"of":[19,47,84,97,114,136,158,190],"both":[20],"languages,":[24],"first":[26],"stage":[27,43,109,178],"is":[28,44,70,131],"to":[29,101,111,118,193],"identify":[30],"languages":[31],"within":[32],"different":[33],"zones":[34],"by":[35,90,133],"using":[36],"geometric":[37],"properties":[38],"differentiation.":[40],"The":[41],"second":[42],"process":[46],"character":[48,68],"recognition,":[49],"in":[50,81,123,141,160,164,169,195],"which":[51],"technique":[53],"developed":[54],"includes":[55],"feature":[57,64],"extractor":[58],"classifier.":[61],"In":[62,175],"extraction,":[65],"thinned":[67],"image":[69],"analyzed":[71],"categorized":[73],"into":[74],"groups.":[75],"Next,":[76],"classifier":[78],"will":[79],"take":[80],"two":[82],"steps":[83],"recognition:":[85],"coarse":[87],"level,":[88],"followed":[89],"fine":[92],"level":[93],"with":[94,138,179],"guide":[96],"decision":[98],"trees.":[99],"As":[100],"obtain":[102,155],"an":[103,124,156],"even":[104],"better":[105,188],"result,":[106],"final":[108,177],"attempts":[110],"make":[112],"use":[113],"dictionary":[115,181],"look-up":[116],"as":[117,198],"check":[119],"accuracy":[121,157,189],"improvement":[122,191],"overall":[125],"performance.":[126],"For":[127],"verification,":[128],"tested":[132],"series":[135],"experiments":[137],"documents":[140,171,197],"141":[142],"pages":[143],"over":[145],"280,000":[146],"characters,":[147],"result":[149],"shows":[150],"that":[151],"could":[154,185],"100%":[159],"monolingual,":[162,166],"98.18%":[163],"99.85%":[168],"on":[172],"average.":[174],"look-up,":[182],"yield":[186],"up":[192],"99.98%":[194],"expected.":[199]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
