{"id":"https://openalex.org/W3199031966","doi":"https://doi.org/10.1109/ijcnn52387.2021.9533713","title":"Regularizing CTC in Expectation-Maximization Framework with Application to Handwritten Text Recognition","display_name":"Regularizing CTC in Expectation-Maximization Framework with Application to Handwritten Text Recognition","publication_year":2021,"publication_date":"2021-07-18","ids":{"openalex":"https://openalex.org/W3199031966","doi":"https://doi.org/10.1109/ijcnn52387.2021.9533713","mag":"3199031966"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn52387.2021.9533713","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9533713","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017249233","display_name":"Likun Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Likun Gao","raw_affiliation_strings":["National Laboratory of Pattern Recognition (NLPR), Institution of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition (NLPR), Institution of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031674072","display_name":"Heng Zhang","orcid":"https://orcid.org/0000-0002-1093-5809"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Zhang","raw_affiliation_strings":["National Laboratory of Pattern Recognition (NLPR), Institution of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition (NLPR), Institution of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100714202","display_name":"Cheng\u2010Lin Liu","orcid":"https://orcid.org/0000-0002-6743-4175"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng-Lin Liu","raw_affiliation_strings":["CAS Center for Excellence in Brain Science and Intelligence Technology, Beijing, China","National Laboratory of Pattern Recognition (NLPR), Institution of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"CAS Center for Excellence in Brain Science and Intelligence Technology, Beijing, China","institution_ids":["https://openalex.org/I4210097554"]},{"raw_affiliation_string":"National Laboratory of Pattern Recognition (NLPR), Institution of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5017249233"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210100255","https://openalex.org/I4210112150","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.5764,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.68527778,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8024474382400513},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.6939787268638611},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5936932563781738},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.5896764397621155},{"id":"https://openalex.org/keywords/expectation\u2013maximization-algorithm","display_name":"Expectation\u2013maximization algorithm","score":0.5847621560096741},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.5694093704223633},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.5226397514343262},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5133673548698425},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.471731573343277},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4398728311061859},{"id":"https://openalex.org/keywords/majority-rule","display_name":"Majority rule","score":0.42648160457611084},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32403630018234253},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.22830399870872498},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.194926917552948},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0954938530921936}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8024474382400513},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.6939787268638611},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5936932563781738},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.5896764397621155},{"id":"https://openalex.org/C182081679","wikidata":"https://www.wikidata.org/wiki/Q1275153","display_name":"Expectation\u2013maximization algorithm","level":3,"score":0.5847621560096741},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.5694093704223633},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.5226397514343262},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5133673548698425},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.471731573343277},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4398728311061859},{"id":"https://openalex.org/C153668964","wikidata":"https://www.wikidata.org/wiki/Q27636","display_name":"Majority rule","level":2,"score":0.42648160457611084},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32403630018234253},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.22830399870872498},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.194926917552948},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0954938530921936},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn52387.2021.9533713","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9533713","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.4300000071525574}],"awards":[{"id":"https://openalex.org/G5996648377","display_name":null,"funder_award_id":"61936003,61721004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8008905905","display_name":null,"funder_award_id":"2020AAA0109702","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W194242946","https://openalex.org/W1522301498","https://openalex.org/W1981367467","https://openalex.org/W2000145530","https://openalex.org/W2002342963","https://openalex.org/W2008164950","https://openalex.org/W2008225289","https://openalex.org/W2049633694","https://openalex.org/W2105518985","https://openalex.org/W2122585011","https://openalex.org/W2147393756","https://openalex.org/W2152928267","https://openalex.org/W2153182373","https://openalex.org/W2154070811","https://openalex.org/W2183341477","https://openalex.org/W2194187530","https://openalex.org/W2528751927","https://openalex.org/W2567948266","https://openalex.org/W2581377246","https://openalex.org/W2593572697","https://openalex.org/W2740767790","https://openalex.org/W2741436143","https://openalex.org/W2751748110","https://openalex.org/W2763095131","https://openalex.org/W2765407302","https://openalex.org/W2793404167","https://openalex.org/W2795619303","https://openalex.org/W2891267443","https://openalex.org/W2892209435","https://openalex.org/W2902521343","https://openalex.org/W2948210185","https://openalex.org/W2959965583","https://openalex.org/W2963517393","https://openalex.org/W2964099383","https://openalex.org/W2964121744","https://openalex.org/W2964612108","https://openalex.org/W2970206392","https://openalex.org/W2998382406","https://openalex.org/W3004391146","https://openalex.org/W4250589301","https://openalex.org/W4297798436","https://openalex.org/W6631190155","https://openalex.org/W6682488149","https://openalex.org/W6704241340","https://openalex.org/W6732696085","https://openalex.org/W6744179516","https://openalex.org/W6745136726","https://openalex.org/W6754576048","https://openalex.org/W6754747464"],"related_works":["https://openalex.org/W2103111323","https://openalex.org/W3121841074","https://openalex.org/W1976188970","https://openalex.org/W2055572829","https://openalex.org/W3036613766","https://openalex.org/W1894159578","https://openalex.org/W2807400035","https://openalex.org/W2889559465","https://openalex.org/W2990541822","https://openalex.org/W3125086856"],"abstract_inverted_index":{"Connectionist":[0],"Temporal":[1],"Classification":[2],"(CTC)":[3],"is":[4],"an":[5],"objective":[6],"function":[7],"for":[8],"sequence":[9],"learning":[10],"and":[11,18,60,92,117],"has":[12,26],"shown":[13],"promising":[14],"results":[15,120],"in":[16],"speech":[17],"text":[19,69,104],"recognition":[20,105],"tasks.":[21],"However,":[22],"its":[23],"inherent":[24],"mechanism":[25,96],"not":[27],"been":[28],"investigated":[29],"thoroughly.":[30],"In":[31],"this":[32],"paper,":[33],"we":[34,54],"propose":[35,55],"a":[36,56,94],"theoretical":[37],"explanation":[38],"of":[39,44,68,90,102],"CTC":[40,91,115],"from":[41],"the":[42,45,51,66,76,81,86,98,108,114],"perspective":[43],"Expectation-Maximization":[46],"(EM)":[47],"algorithm.":[48],"Based":[49],"on":[50,121],"EM":[52],"analysis,":[53],"pseudo-label-based":[57],"L1":[58,72],"regularization":[59,73],"voting":[61,82,95],"decoding":[62,83,88],"algorithm":[63,84],"to":[64,97],"improve":[65],"performance":[67],"recognition.":[70],"The":[71],"can":[74],"reduce":[75],"pseudo-label":[77],"estimation":[78],"error,":[79],"while":[80],"modifies":[85],"built-in":[87],"logic":[89],"introduces":[93],"inference":[99],"process.":[100],"Experiments":[101],"handwritten":[103],"show":[106],"that":[107],"proposed":[109],"method":[110],"consistently":[111],"improves":[112],"over":[113],"baseline":[116],"yields":[118],"state-of-the-art":[119],"three":[122],"benchmark":[123],"datasets.":[124]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
