{"id":"https://openalex.org/W2101842906","doi":"https://doi.org/10.1109/icdar.2015.7333965","title":"OCR for bilingual documents using language modeling","display_name":"OCR for bilingual documents using language modeling","publication_year":2015,"publication_date":"2015-08-01","ids":{"openalex":"https://openalex.org/W2101842906","doi":"https://doi.org/10.1109/icdar.2015.7333965","mag":"2101842906"},"language":"en","primary_location":{"id":"doi:10.1109/icdar.2015.7333965","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdar.2015.7333965","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 13th International Conference on Document Analysis and Recognition (ICDAR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009175236","display_name":"Anupama Ray","orcid":"https://orcid.org/0000-0002-9193-5017"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Anupama Ray","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology, Delhi","Department of Electrical Engineering Indian Institute of Technology Delhi, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology, Delhi","institution_ids":["https://openalex.org/I68891433"]},{"raw_affiliation_string":"Department of Electrical Engineering Indian Institute of Technology Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041629023","display_name":"Sai Rajeswar","orcid":null},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sai Rajeswar","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology, Delhi","Department of Electrical Engineering Indian Institute of Technology Delhi, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology, Delhi","institution_ids":["https://openalex.org/I68891433"]},{"raw_affiliation_string":"Department of Electrical Engineering Indian Institute of Technology Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086242686","display_name":"Santanu Chaudhury","orcid":"https://orcid.org/0000-0002-5488-7773"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Santanu Chaudhury","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology, Delhi","Department of Electrical Engineering Indian Institute of Technology Delhi, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology, Delhi","institution_ids":["https://openalex.org/I68891433"]},{"raw_affiliation_string":"Department of Electrical Engineering Indian Institute of Technology Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5009175236"],"corresponding_institution_ids":["https://openalex.org/I68891433"],"apc_list":null,"apc_paid":null,"fwci":0.7364,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.79071053,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"1","issue":null,"first_page":"1256","last_page":"1260"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8849778771400452},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7393099665641785},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.7297738790512085},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.6633957624435425},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6530964374542236},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5987732410430908},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5245859026908875},{"id":"https://openalex.org/keywords/telugu","display_name":"Telugu","score":0.5048449635505676},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.499431848526001},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4945497214794159},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.48070961236953735},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.4656065106391907},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3780697286128998}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8849778771400452},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7393099665641785},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.7297738790512085},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.6633957624435425},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6530964374542236},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5987732410430908},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5245859026908875},{"id":"https://openalex.org/C2778756302","wikidata":"https://www.wikidata.org/wiki/Q8097","display_name":"Telugu","level":2,"score":0.5048449635505676},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.499431848526001},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4945497214794159},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.48070961236953735},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.4656065106391907},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3780697286128998},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icdar.2015.7333965","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdar.2015.7333965","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 13th International Conference on Document Analysis and Recognition (ICDAR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7200000286102295}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W61757119","https://openalex.org/W1614298861","https://openalex.org/W1985258458","https://openalex.org/W1997674818","https://openalex.org/W2022075901","https://openalex.org/W2061088043","https://openalex.org/W2061436640","https://openalex.org/W2079735306","https://openalex.org/W2083941131","https://openalex.org/W2104888441","https://openalex.org/W2106089090","https://openalex.org/W2110699760","https://openalex.org/W2113459411","https://openalex.org/W2114326232","https://openalex.org/W2115542396","https://openalex.org/W2120854963","https://openalex.org/W2126109012","https://openalex.org/W2127319406","https://openalex.org/W2128060444","https://openalex.org/W2130872173","https://openalex.org/W2149940198","https://openalex.org/W2154942898","https://openalex.org/W2167898728","https://openalex.org/W2171928131","https://openalex.org/W2402268235","https://openalex.org/W2474824677","https://openalex.org/W2950577311","https://openalex.org/W6636510571","https://openalex.org/W6675773814","https://openalex.org/W6676984168","https://openalex.org/W6684575925","https://openalex.org/W6720877245"],"related_works":["https://openalex.org/W2538934695","https://openalex.org/W2164215946","https://openalex.org/W2120407907","https://openalex.org/W2016860631","https://openalex.org/W4312133738","https://openalex.org/W2253106576","https://openalex.org/W2895456681","https://openalex.org/W4289422041","https://openalex.org/W2064096728","https://openalex.org/W2113687551"],"abstract_inverted_index":{"Script":[0],"based":[1],"features":[2,26],"are":[3,13,121],"highly":[4],"discriminative":[5],"for":[6,34,50,67,103,123,169],"text":[7,81,112],"segmentation":[8,120],"and":[9,83,99,119,150,159,174,178],"recognition.":[10,126],"Thus":[11],"they":[12],"widely":[14],"used":[15],"in":[16,57],"Optical":[17],"Character":[18],"Recognition(OCR)":[19],"problems.":[20],"But":[21,53,127],"usage":[22],"of":[23,30,59,96,125,172],"script":[24,38,77],"dependent":[25],"restricts":[27],"the":[28,54,85,161],"adaptation":[29],"such":[31,116],"architectures":[32],"directly":[33],"another":[35],"script.":[36],"With":[37],"independent":[39],"systems,":[40],"this":[41,140,167],"problem":[42,55],"can":[43],"be":[44],"solved":[45],"to":[46,71,111,135,155],"a":[47,68,76,93,152],"certain":[48],"extent":[49],"monolingual":[51],"documents.":[52],"aggravates":[56],"case":[58],"multilingual":[60],"documents":[61,177],"as":[62,117,147],"it":[63],"is":[64,88],"very":[65],"difficult":[66],"single":[69,184],"classifier":[70,87],"learn":[72],"many":[73],"scripts.":[74],"Generally":[75],"identification":[78],"module":[79],"identifies":[80],"segments":[82],"accordingly":[84],"script-dependent":[86],"selected.":[89],"This":[90],"paper":[91,141],"presents":[92],"unified":[94],"framework":[95],"language":[97,153],"model":[98,154],"multiple":[100,144],"preprocessing":[101,114,145],"hypotheses":[102,149],"word":[104,170],"recognition":[105,137,171,181],"from":[106],"bilingual":[107,176],"document":[108],"images.":[109],"Prior":[110],"recognition,":[113],"steps":[115,129],"binarization":[118],"required":[122],"ease":[124],"these":[128],"induce":[130],"huge":[131],"combinatorial":[132],"error":[133],"propagating":[134],"final":[136],"accuracy.":[138],"In":[139],"we":[142],"use":[143,151],"routines":[146],"alternate":[148],"verify":[156],"each":[157],"alternative":[158],"choose":[160],"best":[162],"recognized":[163],"sequence.":[164],"We":[165],"test":[166],"architecture":[168],"Kannada-English":[173],"Telugu-English":[175],"achieved":[179],"better":[180],"rates":[182],"than":[183],"methods":[185],"using":[186],"same":[187],"classifier.":[188]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
