{"id":"https://openalex.org/W4404030313","doi":"https://doi.org/10.1109/icccnt61001.2024.10726007","title":"Deep Learning-Based Optical Character Recognition for Robust Real-World Conditions: A Comparative Analysis","display_name":"Deep Learning-Based Optical Character Recognition for Robust Real-World Conditions: A Comparative Analysis","publication_year":2024,"publication_date":"2024-06-24","ids":{"openalex":"https://openalex.org/W4404030313","doi":"https://doi.org/10.1109/icccnt61001.2024.10726007"},"language":"en","primary_location":{"id":"doi:10.1109/icccnt61001.2024.10726007","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt61001.2024.10726007","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 15th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050784280","display_name":"Aniket Mishra","orcid":null},"institutions":[{"id":"https://openalex.org/I81556334","display_name":"Amrita Vishwa Vidyapeetham","ror":"https://ror.org/03am10p12","country_code":"IN","type":"education","lineage":["https://openalex.org/I81556334"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Aniket Mishra","raw_affiliation_strings":["Computer Science and Engineering Amrita Vishwa Vidyapeetham,Chennai,India"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Amrita Vishwa Vidyapeetham,Chennai,India","institution_ids":["https://openalex.org/I81556334"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114515694","display_name":"Jayanta Sikdar","orcid":null},"institutions":[{"id":"https://openalex.org/I81556334","display_name":"Amrita Vishwa Vidyapeetham","ror":"https://ror.org/03am10p12","country_code":"IN","type":"education","lineage":["https://openalex.org/I81556334"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Jayanta Sikdar","raw_affiliation_strings":["Computer Science and Engineering Amrita Vishwa Vidyapeetham,Chennai,India"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Amrita Vishwa Vidyapeetham,Chennai,India","institution_ids":["https://openalex.org/I81556334"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010379237","display_name":"Sandeep Kumar","orcid":"https://orcid.org/0000-0003-4125-4165"},"institutions":[{"id":"https://openalex.org/I81556334","display_name":"Amrita Vishwa Vidyapeetham","ror":"https://ror.org/03am10p12","country_code":"IN","type":"education","lineage":["https://openalex.org/I81556334"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"S Udhaya Kumar","raw_affiliation_strings":["Computer Science and Engineering Amrita Vishwa Vidyapeetham,Chennai,India"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Amrita Vishwa Vidyapeetham,Chennai,India","institution_ids":["https://openalex.org/I81556334"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5050784280"],"corresponding_institution_ids":["https://openalex.org/I81556334"],"apc_list":null,"apc_paid":null,"fwci":1.3158,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.82321068,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9621999859809875,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9621999859809875,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6702536344528198},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.6085933446884155},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6074267029762268},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5368853807449341},{"id":"https://openalex.org/keywords/character-recognition","display_name":"Character recognition","score":0.5207121968269348},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.4432998597621918},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.391944020986557},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11205890774726868}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6702536344528198},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.6085933446884155},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6074267029762268},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5368853807449341},{"id":"https://openalex.org/C2987247673","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Character recognition","level":3,"score":0.5207121968269348},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.4432998597621918},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.391944020986557},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11205890774726868},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icccnt61001.2024.10726007","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt61001.2024.10726007","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 15th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2015981126","https://openalex.org/W2940927814","https://openalex.org/W2970103342","https://openalex.org/W3035313607","https://openalex.org/W3045882047","https://openalex.org/W3092619036","https://openalex.org/W3111412136","https://openalex.org/W3125812125","https://openalex.org/W3207901375","https://openalex.org/W3216666189","https://openalex.org/W4205445027","https://openalex.org/W4213106045","https://openalex.org/W4307262224","https://openalex.org/W4379385788","https://openalex.org/W4382202677","https://openalex.org/W4394625882","https://openalex.org/W6769185743","https://openalex.org/W6798825125"],"related_works":["https://openalex.org/W1991513203","https://openalex.org/W2892704491","https://openalex.org/W3178467699","https://openalex.org/W4312612713","https://openalex.org/W2106936331","https://openalex.org/W1985626581","https://openalex.org/W2042634493","https://openalex.org/W2100798736","https://openalex.org/W2728450881","https://openalex.org/W2481236784"],"abstract_inverted_index":{"This":[0,100],"paper":[1],"offers":[2],"a":[3,31,77,117],"comprehensive":[4,118],"comparative":[5],"analysis":[6,52],"of":[7,61,74,120,135,197,203,224],"Optical":[8],"Character":[9],"Recognition":[10],"(OCR)":[11],"techniques,":[12],"spanning":[13],"from":[14],"traditional":[15],"methods":[16],"to":[17,91,140,156,172,185],"advanced":[18],"deep":[19,88],"learning":[20,205],"models":[21],"such":[22],"as":[23,30,103],"Transformers,":[24],"BERT,":[25,139],"and":[26,48,59,110,123,152,160,188,200,222],"Bi-LSTM.":[27],"OCR":[28,114,121,142,158,170,192,208,225],"serves":[29,102],"pivotal":[32],"tool":[33],"for":[34,84,107,207,216],"converting":[35],"printed":[36],"or":[37],"handwritten":[38],"text":[39,49,150],"into":[40,56,132],"digital":[41],"formats,":[42],"facilitating":[43],"applications":[44],"in":[45,68,113,147,191],"document":[46],"digitization":[47],"analysis.":[50],"Our":[51],"provides":[53],"valuable":[54],"insights":[55],"the":[57,72,133,141,195,201,219],"strengths":[58],"weaknesses":[60],"each":[62],"approach,":[63],"thereby":[64,177],"elucidating":[65],"their":[66,124,145,154,174],"practicality":[67],"real-world":[69],"scenarios.":[70],"In":[71],"domain":[73],"information":[75,199],"retrieval,":[76],"novel":[78],"approach":[79],"entails":[80],"leveraging":[81],"bidirectional":[82],"LSTM":[83],"semantic":[85],"search,":[86],"harnessing":[87],"neural":[89],"networks":[90],"comprehend":[92],"textual":[93],"content":[94],"nuances":[95],"beyond":[96],"mere":[97],"keyword":[98],"matching.":[99],"study":[101],"an":[104],"indispensable":[105],"resource":[106],"researchers,":[108],"practitioners,":[109],"developers":[111],"interested":[112],"technology,":[115],"furnishing":[116],"overview":[119],"techniques":[122,166],"applicability":[125],"across":[126,227],"various":[127],"domains.":[128,229],"Furthermore,":[129],"we":[130],"delve":[131],"adaptation":[134],"Transformer":[136],"models,":[137],"including":[138],"domain,":[143],"assessing":[144],"efficacy":[146],"handling":[148],"diverse":[149,228],"types":[151],"discussing":[153],"potential":[155],"enhance":[157],"accuracy":[159],"robustness.":[161],"We":[162],"also":[163],"explore":[164],"ensemble":[165],"that":[167],"amalgamate":[168],"multiple":[169],"approaches":[171],"exploit":[173],"complementary":[175],"strengths,":[176],"augmenting":[178],"overall":[179],"performance.":[180],"Moreover,":[181],"our":[182],"exploration":[183,202],"extends":[184],"emerging":[186],"trends":[187],"future":[189],"directions":[190],"research,":[193],"encompassing":[194],"integration":[196],"multimodal":[198],"self-supervised":[204],"paradigms":[206],"model":[209],"training.":[210],"These":[211],"advancements":[212],"hold":[213],"significant":[214],"promise":[215],"further":[217],"elevating":[218],"accuracy,":[220],"efficiency,":[221],"versatility":[223],"systems":[226]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
