{"id":"https://openalex.org/W1997674818","doi":"https://doi.org/10.1145/2505377.2509977","title":"Multilingual OCR research and applications","display_name":"Multilingual OCR research and applications","publication_year":2013,"publication_date":"2013-08-24","ids":{"openalex":"https://openalex.org/W1997674818","doi":"https://doi.org/10.1145/2505377.2509977","mag":"1997674818"},"language":"en","primary_location":{"id":"doi:10.1145/2505377.2509977","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2505377.2509977","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 4th International Workshop on Multilingual OCR","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102329211","display_name":"Xujun Peng","orcid":"https://orcid.org/0000-0001-9373-7092"},"institutions":[{"id":"https://openalex.org/I1306686416","display_name":"RTX (United States)","ror":"https://ror.org/0354t7b78","country_code":"US","type":"company","lineage":["https://openalex.org/I1306686416"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xujun Peng","raw_affiliation_strings":["Raytheon BBN Technologies, Cambridge, MA","[Raytheon BBN Technologies, Cambridge, MA]"],"affiliations":[{"raw_affiliation_string":"Raytheon BBN Technologies, Cambridge, MA","institution_ids":["https://openalex.org/I1306686416"]},{"raw_affiliation_string":"[Raytheon BBN Technologies, Cambridge, MA]","institution_ids":["https://openalex.org/I1306686416"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108504544","display_name":"Huaigu Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I1306686416","display_name":"RTX (United States)","ror":"https://ror.org/0354t7b78","country_code":"US","type":"company","lineage":["https://openalex.org/I1306686416"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Huaigu Cao","raw_affiliation_strings":["Raytheon BBN Technologies, Cambridge, MA","[Raytheon BBN Technologies, Cambridge, MA]"],"affiliations":[{"raw_affiliation_string":"Raytheon BBN Technologies, Cambridge, MA","institution_ids":["https://openalex.org/I1306686416"]},{"raw_affiliation_string":"[Raytheon BBN Technologies, Cambridge, MA]","institution_ids":["https://openalex.org/I1306686416"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036052557","display_name":"Srirangaraj Setlur","orcid":"https://orcid.org/0000-0002-7118-9280"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Srirangaraj Setlur","raw_affiliation_strings":["CUBS, University at Buffalo, Buffalo, NY"],"affiliations":[{"raw_affiliation_string":"CUBS, University at Buffalo, Buffalo, NY","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020354604","display_name":"Venu Govindaraju","orcid":"https://orcid.org/0000-0002-5318-7409"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Venu Govindaraju","raw_affiliation_strings":["CUBS, University at Buffalo, Buffalo, NY"],"affiliations":[{"raw_affiliation_string":"CUBS, University at Buffalo, Buffalo, NY","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066184920","display_name":"Prem Natarajan","orcid":"https://orcid.org/0000-0002-4386-6651"},"institutions":[{"id":"https://openalex.org/I2801204180","display_name":"Marina Del Rey Hospital","ror":"https://ror.org/05wqyfz02","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I2801204180"]},{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Prem Natarajan","raw_affiliation_strings":["Univ. of Southern California, Marina del Rey, CA"],"affiliations":[{"raw_affiliation_string":"Univ. of Southern California, Marina del Rey, CA","institution_ids":["https://openalex.org/I2801204180","https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102329211"],"corresponding_institution_ids":["https://openalex.org/I1306686416"],"apc_list":null,"apc_paid":null,"fwci":2.1772,"has_fulltext":false,"cited_by_count":27,"citation_normalized_percentile":{"value":0.88954871,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8521378040313721},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.7376111745834351},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.7140336632728577},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6619320511817932},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.594749391078949},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5842326879501343},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4735238552093506},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4727253317832947},{"id":"https://openalex.org/keywords/handwriting-recognition","display_name":"Handwriting recognition","score":0.4475305676460266},{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.4254497289657593},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.3184499740600586},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08995851874351501}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8521378040313721},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.7376111745834351},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.7140336632728577},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6619320511817932},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.594749391078949},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5842326879501343},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4735238552093506},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4727253317832947},{"id":"https://openalex.org/C112640561","wikidata":"https://www.wikidata.org/wiki/Q2440634","display_name":"Handwriting recognition","level":3,"score":0.4475305676460266},{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.4254497289657593},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3184499740600586},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08995851874351501},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2505377.2509977","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2505377.2509977","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 4th International Workshop on Multilingual OCR","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8500000238418579}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W13965504","https://openalex.org/W46134239","https://openalex.org/W102704617","https://openalex.org/W1491852184","https://openalex.org/W1544794770","https://openalex.org/W1968568012","https://openalex.org/W1995574284","https://openalex.org/W2001642682","https://openalex.org/W2012448972","https://openalex.org/W2015591846","https://openalex.org/W2025694764","https://openalex.org/W2028180100","https://openalex.org/W2038529276","https://openalex.org/W2044485638","https://openalex.org/W2050036944","https://openalex.org/W2055408294","https://openalex.org/W2061802763","https://openalex.org/W2068824048","https://openalex.org/W2076886798","https://openalex.org/W2077895339","https://openalex.org/W2080228837","https://openalex.org/W2081112606","https://openalex.org/W2091696127","https://openalex.org/W2093100897","https://openalex.org/W2096686108","https://openalex.org/W2098236080","https://openalex.org/W2100607392","https://openalex.org/W2103132709","https://openalex.org/W2104209319","https://openalex.org/W2106382161","https://openalex.org/W2106693967","https://openalex.org/W2114781615","https://openalex.org/W2116168999","https://openalex.org/W2120165255","https://openalex.org/W2125462973","https://openalex.org/W2127319406","https://openalex.org/W2132669457","https://openalex.org/W2133552271","https://openalex.org/W2135164809","https://openalex.org/W2135249422","https://openalex.org/W2137975285","https://openalex.org/W2143060414","https://openalex.org/W2146366522","https://openalex.org/W2146850796","https://openalex.org/W2147768505","https://openalex.org/W2148645152","https://openalex.org/W2149266633","https://openalex.org/W2149319679","https://openalex.org/W2149925729","https://openalex.org/W2163237111","https://openalex.org/W2163534337","https://openalex.org/W2164125420","https://openalex.org/W2164863177","https://openalex.org/W2170942820","https://openalex.org/W4229847583","https://openalex.org/W4242842265","https://openalex.org/W4256718973","https://openalex.org/W6604092412","https://openalex.org/W6669770651","https://openalex.org/W6669939159","https://openalex.org/W6884928307"],"related_works":["https://openalex.org/W143289143","https://openalex.org/W4200294382","https://openalex.org/W2943834649","https://openalex.org/W2108604059","https://openalex.org/W4377224118","https://openalex.org/W2158390728","https://openalex.org/W2598403525","https://openalex.org/W4312478864","https://openalex.org/W2182344861","https://openalex.org/W1990936625"],"abstract_inverted_index":{"This":[0,62,74],"paper":[1],"offers":[2],"an":[3,65],"overview":[4],"of":[5,14,49,68,72,87,114],"the":[6,12,31,47,84,94,122],"current":[7],"approaches":[8],"to":[9,34,40,55,83],"research":[10,69,115,127],"in":[11,89,101,116,121,128],"field":[13],"off-line":[15,19],"multilingual":[16,35,79,99,129],"OCR.":[17],"Typically,":[18],"OCR":[20,36,100,130],"systems":[21],"are":[22,119,131],"designed":[23],"for":[24,78,98,125],"a":[25,42,111],"particular":[26],"script":[27,105],"or":[28],"language.":[29],"However,":[30],"ideal":[32],"approach":[33],"would":[37],"likely":[38],"be":[39,53],"develop":[41],"system":[43],"that":[44],"can,":[45],"with":[46,59,70],"use":[48],"language-specific":[50],"training":[51],"data,":[52],"re-targeted":[54],"process":[56],"different":[57],"languages":[58],"minimal":[60],"modifications.":[61],"is":[63,75],"still":[64],"open":[66],"area":[67],"plenty":[71],"challenges.":[73],"particularly":[76],"true":[77],"handwriting":[80],"recognition":[81,108],"due":[82],"added":[85],"complexity":[86],"variations":[88],"writing":[90],"styles":[91],"even":[92],"within":[93],"same":[95],"scripts.":[96],"Challenges":[97],"preprocessing,":[102],"feature":[103],"extraction,":[104],"identification":[106],"and":[107,110],"modeling":[109],"brief":[112],"survey":[113],"these":[117],"areas":[118],"presented":[120],"paper.":[123],"Ideas":[124],"future":[126],"outlined.":[132]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
