{"id":"https://openalex.org/W4404915910","doi":"https://doi.org/10.1109/scisisis61014.2024.10759989","title":"Handwritten Character String Recognition Using Transformer and CNN Features","display_name":"Handwritten Character String Recognition Using Transformer and CNN Features","publication_year":2024,"publication_date":"2024-11-09","ids":{"openalex":"https://openalex.org/W4404915910","doi":"https://doi.org/10.1109/scisisis61014.2024.10759989"},"language":"en","primary_location":{"id":"doi:10.1109/scisisis61014.2024.10759989","is_oa":false,"landing_page_url":"https://doi.org/10.1109/scisisis61014.2024.10759989","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 Joint 13th International Conference on Soft Computing and Intelligent Systems and 25th International Symposium on Advanced Intelligent Systems (SCIS&amp;amp;ISIS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114957369","display_name":"Shunya Rakuka","orcid":null},"institutions":[{"id":"https://openalex.org/I178574317","display_name":"Mie University","ror":"https://ror.org/01529vy56","country_code":"JP","type":"education","lineage":["https://openalex.org/I178574317"]},{"id":"https://openalex.org/I4210128676","display_name":"Human Computer Interaction (Switzerland)","ror":"https://ror.org/036dv6j71","country_code":"CH","type":"company","lineage":["https://openalex.org/I4210128676"]}],"countries":["CH","JP"],"is_corresponding":true,"raw_author_name":"Shunya Rakuka","raw_affiliation_strings":["Mie University,Human Computer Interaction Lab"],"affiliations":[{"raw_affiliation_string":"Mie University,Human Computer Interaction Lab","institution_ids":["https://openalex.org/I4210128676","https://openalex.org/I178574317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040874965","display_name":"Kento Morita","orcid":"https://orcid.org/0000-0002-7171-8197"},"institutions":[{"id":"https://openalex.org/I4210128676","display_name":"Human Computer Interaction (Switzerland)","ror":"https://ror.org/036dv6j71","country_code":"CH","type":"company","lineage":["https://openalex.org/I4210128676"]},{"id":"https://openalex.org/I178574317","display_name":"Mie University","ror":"https://ror.org/01529vy56","country_code":"JP","type":"education","lineage":["https://openalex.org/I178574317"]}],"countries":["CH","JP"],"is_corresponding":false,"raw_author_name":"Kento Morita","raw_affiliation_strings":["Mie University,Human Computer Interaction Lab"],"affiliations":[{"raw_affiliation_string":"Mie University,Human Computer Interaction Lab","institution_ids":["https://openalex.org/I4210128676","https://openalex.org/I178574317"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111490360","display_name":"Tetsushi Wakabayashi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210128676","display_name":"Human Computer Interaction (Switzerland)","ror":"https://ror.org/036dv6j71","country_code":"CH","type":"company","lineage":["https://openalex.org/I4210128676"]},{"id":"https://openalex.org/I178574317","display_name":"Mie University","ror":"https://ror.org/01529vy56","country_code":"JP","type":"education","lineage":["https://openalex.org/I178574317"]}],"countries":["CH","JP"],"is_corresponding":false,"raw_author_name":"Tetsushi Wakabayashi","raw_affiliation_strings":["Mie University,Human Computer Interaction Lab"],"affiliations":[{"raw_affiliation_string":"Mie University,Human Computer Interaction Lab","institution_ids":["https://openalex.org/I4210128676","https://openalex.org/I178574317"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5114957369"],"corresponding_institution_ids":["https://openalex.org/I178574317","https://openalex.org/I4210128676"],"apc_list":null,"apc_paid":null,"fwci":0.5248,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67927019,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9624999761581421,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9620000123977661,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/character-recognition","display_name":"Character recognition","score":0.7342883348464966},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7076631784439087},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6874023675918579},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5989491939544678},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5409094095230103},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5407872200012207},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.5032348036766052},{"id":"https://openalex.org/keywords/intelligent-word-recognition","display_name":"Intelligent word recognition","score":0.4860137403011322},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.46689924597740173},{"id":"https://openalex.org/keywords/intelligent-character-recognition","display_name":"Intelligent character recognition","score":0.3710264563560486},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.158189594745636},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14513570070266724},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11116358637809753},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.0878286361694336}],"concepts":[{"id":"https://openalex.org/C2987247673","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Character recognition","level":3,"score":0.7342883348464966},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7076631784439087},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6874023675918579},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5989491939544678},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5409094095230103},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5407872200012207},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.5032348036766052},{"id":"https://openalex.org/C17649283","wikidata":"https://www.wikidata.org/wiki/Q6044162","display_name":"Intelligent word recognition","level":5,"score":0.4860137403011322},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.46689924597740173},{"id":"https://openalex.org/C44868376","wikidata":"https://www.wikidata.org/wiki/Q3099089","display_name":"Intelligent character recognition","level":4,"score":0.3710264563560486},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.158189594745636},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14513570070266724},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11116358637809753},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0878286361694336},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/scisisis61014.2024.10759989","is_oa":false,"landing_page_url":"https://doi.org/10.1109/scisisis61014.2024.10759989","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 Joint 13th International Conference on Soft Computing and Intelligent Systems and 25th International Symposium on Advanced Intelligent Systems (SCIS&amp;amp;ISIS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2194187530","https://openalex.org/W2810983211","https://openalex.org/W2963517393","https://openalex.org/W2963526661","https://openalex.org/W2967615747","https://openalex.org/W3003642782","https://openalex.org/W3094502228","https://openalex.org/W4304014014","https://openalex.org/W4312233877","https://openalex.org/W4382202677","https://openalex.org/W4385245566","https://openalex.org/W4394625882","https://openalex.org/W6679436768","https://openalex.org/W6741742085","https://openalex.org/W6793890502"],"related_works":["https://openalex.org/W2218402054","https://openalex.org/W4309724674","https://openalex.org/W2811459303","https://openalex.org/W2576806841","https://openalex.org/W2110452885","https://openalex.org/W2553283597","https://openalex.org/W2424456397","https://openalex.org/W2765918780","https://openalex.org/W2096434575","https://openalex.org/W2574457628"],"abstract_inverted_index":{"While":[0],"character":[1,28,42,74,82,148,155,173],"recognition":[2,14,30,76],"systems":[3],"applications":[4],"with":[5,106],"restrictions":[6],"on":[7],"writing":[8],"conditions,":[9],"such":[10],"as":[11],"zip":[12],"code":[13],"and":[15,34,57,86,129,134,159],"ledger":[16],"sheet":[17],"recognition,":[18,150],"are":[19,36,44,59],"in":[20,65],"practical":[21],"use,":[22],"the":[23,117,120,141,152],"accuracy":[24],"of":[25,53,96,110,119,154,168],"free":[26,40],"handwritten":[27,41,73],"string":[29,75,149],"is":[31,144,157,161],"still":[32],"low":[33],"there":[35,58],"many":[37],"challenges.":[38],"Japanese":[39,50,147],"strings":[43,156],"difficult":[45,162],"to":[46,163],"segment":[47],"because":[48],"some":[49],"characters":[51],"consist":[52],"multiple":[54],"connected":[55],"components":[56],"no":[60],"spaces":[61],"between":[62],"words.":[63],"Therefore,":[64],"this":[66],"study,":[67],"we":[68],"propose":[69],"a":[70,93,107,165],"method":[71,77,102,122,143],"for":[72,146,171],"that":[78,140],"does":[79],"not":[80],"require":[81,92],"segmentation":[83],"using":[84],"Transformer":[85],"CNN":[87],"features.":[88],"Transformer-based":[89],"models":[90],"usually":[91],"large":[94,158],"amount":[95,109],"annotated":[97,111],"training":[98,112,169],"data.":[99,113],"However,":[100],"our":[101],"can":[103],"be":[104],"trained":[105],"small":[108],"Comparative":[114],"experiments":[115],"confirm":[116],"effectiveness":[118],"proposed":[121,142],"by":[123],"achieving":[124],"CER=O.127":[125],"while":[126],"CRNN":[127],"[1]":[128],"TrOCR":[130],"[2]":[131],"achieve":[132],"CER=O.562":[133],"CER=O.174,":[135],"respectively.":[136],"The":[137],"results":[138],"show":[139],"effective":[145],"where":[151],"variety":[153],"it":[160],"secure":[164],"sufficient":[166],"number":[167],"samples":[170],"each":[172],"string.":[174]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
