{"id":"https://openalex.org/W4407451030","doi":"https://doi.org/10.1109/tpami.2025.3533737","title":"CCDPlus: Towards Accurate Character to Character Distillation for Text Recognition","display_name":"CCDPlus: Towards Accurate Character to Character Distillation for Text Recognition","publication_year":2025,"publication_date":"2025-02-13","ids":{"openalex":"https://openalex.org/W4407451030","doi":"https://doi.org/10.1109/tpami.2025.3533737","pmid":"https://pubmed.ncbi.nlm.nih.gov/40031846"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3533737","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3533737","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059748327","display_name":"Tongkun Guan","orcid":"https://orcid.org/0000-0003-3346-8315"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tongkun Guan","raw_affiliation_strings":["MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Wei Shen","orcid":"https://orcid.org/0000-0002-1235-598X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Shen","raw_affiliation_strings":["MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":null,"display_name":"Xiaokang Yang","orcid":"https://orcid.org/0000-0003-4029-3322"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaokang Yang","raw_affiliation_strings":["MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059748327"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":1.2181,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.76009791,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"47","issue":"5","first_page":"3546","last_page":"3562"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9448000192642212,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9413999915122986,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.8852285146713257},{"id":"https://openalex.org/keywords/character-recognition","display_name":"Character recognition","score":0.7036150693893433},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6942986249923706},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6651654839515686},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.506622850894928},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5009379386901855},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.45971420407295227},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.45013606548309326},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4400981664657593},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4222294092178345},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12496289610862732},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08751049637794495},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06546124815940857}],"concepts":[{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.8852285146713257},{"id":"https://openalex.org/C2987247673","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Character recognition","level":3,"score":0.7036150693893433},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6942986249923706},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6651654839515686},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.506622850894928},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5009379386901855},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.45971420407295227},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.45013606548309326},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4400981664657593},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4222294092178345},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12496289610862732},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08751049637794495},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06546124815940857},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3533737","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3533737","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:40031846","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40031846","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6402690117","display_name":null,"funder_award_id":"62322604","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G81657677","display_name":null,"funder_award_id":"62176159","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":93,"referenced_works":["https://openalex.org/W1885185971","https://openalex.org/W1971822075","https://openalex.org/W1981283549","https://openalex.org/W1998042868","https://openalex.org/W2004767896","https://openalex.org/W2008806374","https://openalex.org/W2033404582","https://openalex.org/W2122221966","https://openalex.org/W2127141656","https://openalex.org/W2144554289","https://openalex.org/W2146835493","https://openalex.org/W2194187530","https://openalex.org/W2343052201","https://openalex.org/W2750938222","https://openalex.org/W2810983211","https://openalex.org/W2875814315","https://openalex.org/W2914492226","https://openalex.org/W2963299604","https://openalex.org/W2963470893","https://openalex.org/W2963526661","https://openalex.org/W2965066169","https://openalex.org/W2997749585","https://openalex.org/W2998382406","https://openalex.org/W3003642782","https://openalex.org/W3004846386","https://openalex.org/W3005436539","https://openalex.org/W3013224334","https://openalex.org/W3034414401","https://openalex.org/W3034447740","https://openalex.org/W3035449864","https://openalex.org/W3035524453","https://openalex.org/W3094502228","https://openalex.org/W3096739052","https://openalex.org/W3110267192","https://openalex.org/W3159481202","https://openalex.org/W3163005567","https://openalex.org/W3168428721","https://openalex.org/W3173990630","https://openalex.org/W3174746398","https://openalex.org/W3175618949","https://openalex.org/W3175855397","https://openalex.org/W3177684257","https://openalex.org/W3181186176","https://openalex.org/W3192495122","https://openalex.org/W3202415716","https://openalex.org/W3202912918","https://openalex.org/W3204778874","https://openalex.org/W3206615376","https://openalex.org/W3206651063","https://openalex.org/W3211070770","https://openalex.org/W4225562651","https://openalex.org/W4226329156","https://openalex.org/W4226374800","https://openalex.org/W4229030834","https://openalex.org/W4255788608","https://openalex.org/W4283805255","https://openalex.org/W4283819468","https://openalex.org/W4283821822","https://openalex.org/W4312298799","https://openalex.org/W4312804044","https://openalex.org/W4312843595","https://openalex.org/W4312879041","https://openalex.org/W4312923907","https://openalex.org/W4312932251","https://openalex.org/W4312965673","https://openalex.org/W4313045695","https://openalex.org/W4313156423","https://openalex.org/W4385767840","https://openalex.org/W4386065575","https://openalex.org/W4386410320","https://openalex.org/W4390463734","https://openalex.org/W4390754349","https://openalex.org/W4390871832","https://openalex.org/W4390872592","https://openalex.org/W4390873548","https://openalex.org/W4393148058","https://openalex.org/W4393148285","https://openalex.org/W4401024603","https://openalex.org/W4402716330","https://openalex.org/W4402754116","https://openalex.org/W4402772614","https://openalex.org/W4402961694","https://openalex.org/W4403791624","https://openalex.org/W4404002859","https://openalex.org/W4405399726","https://openalex.org/W6629590909","https://openalex.org/W6691603626","https://openalex.org/W6757817989","https://openalex.org/W6762573206","https://openalex.org/W6769908858","https://openalex.org/W6857461731","https://openalex.org/W6872424297","https://openalex.org/W6874369402"],"related_works":["https://openalex.org/W1991513203","https://openalex.org/W2892704491","https://openalex.org/W3178467699","https://openalex.org/W4312612713","https://openalex.org/W2106936331","https://openalex.org/W1985626581","https://openalex.org/W2042634493","https://openalex.org/W2100798736","https://openalex.org/W2728450881","https://openalex.org/W2481236784"],"abstract_inverted_index":{"Existing":[0],"scene":[1,115],"text":[2,116,129],"recognition":[3,20,117,200],"methods":[4,215],"leverage":[5],"large-scale":[6],"labeled":[7],"synthetic":[8],"data":[9,48,94,168],"(LSD)":[10],"to":[11,161],"reduce":[12],"reliance":[13],"on":[14,67,69,78,137,185,190,224,234],"labor-intensive":[15],"annotation":[16],"tasks":[17],"and":[18,37,96,122,197,213,222],"improve":[19],"capability":[21],"in":[22],"real-world":[23,174],"scenarios.":[24],"However,":[25],"the":[26,41,55,61,133,179,194,199,235],"emergence":[27],"of":[28,45,51,57,219],"a":[29,119,231],"synth-to-real":[30],"domain":[31,100,195],"gap":[32],"still":[33],"limits":[34],"their":[35],"efficiency":[36],"robustness.":[38],"Consequently,":[39],"harvesting":[40],"meaningful":[42],"intrinsic":[43],"qualities":[44],"unlabeled":[46],"real":[47],"(URD)":[49],"is":[50],"great":[52],"importance,":[53],"given":[54],"prevalence":[56],"text-laden":[58],"images.":[59],"Toward":[60],"target,":[62],"recent":[63],"efforts":[64],"have":[65],"focused":[66],"pre-training":[68],"URD":[70,138,186],"through":[71],"sequence-to-sequence":[72],"self-supervised":[73,123,183,214],"learning,":[74],"followed":[75],"by":[76,142,216],"fine-tuning":[77],"LSD":[79,147],"via":[80],"supervised":[81,121,188],"learning.":[82],"Nevertheless,":[83],"they":[84],"encounter":[85],"three":[86],"important":[87],"issues:":[88],"coarse":[89],"representation":[90,140],"learning":[91,124,184,189],"units,":[92],"inflexible":[93],"augmentation,":[95,169],"an":[97,109,217],"emerging":[98],"real-to-synth":[99],"drift.":[101],"To":[102],"overcome":[103],"these":[104],"challenges,":[105],"we":[106],"propose":[107],"CCDPlus,":[108],"accurate":[110],"character-to-character":[111,163],"distillation":[112,164],"method":[113],"for":[114,128],"with":[118,166,187],"joint":[120],"framework.":[125],"Specifically,":[126],"tailored":[127],"images,":[130],"CCDPlus":[131,160,206],"delineates":[132],"fine-grained":[134],"character":[135],"structures":[136],"as":[139],"units":[141],"transferring":[143],"knowledge":[144],"learned":[145],"from":[146],"online.":[148],"Without":[149],"requiring":[150],"extra":[151],"bounding":[152],"box":[153],"or":[154],"pixel-level":[155],"annotations,":[156],"this":[157],"process":[158],"allows":[159],"enable":[162],"flexibly":[165],"versatile":[167],"which":[170],"effectively":[171,192],"extracts":[172],"general":[173],"character-level":[175],"feature":[176],"representations.":[177],"Meanwhile,":[178],"unified":[180],"framework":[181],"combines":[182],"LSD,":[191],"solving":[193],"inconsistency":[196],"enhancing":[198],"performance.":[201],"Extensive":[202],"experiments":[203],"demonstrate":[204],"that":[205],"outperforms":[207],"previous":[208],"state-of-the-art":[209],"(SOTA)":[210],"supervised,":[211],"semi-supervised,":[212],"average":[218],"1.8%,":[220],"0.6%,":[221],"1.1%":[223],"standard":[225],"datasets,":[226],"respectively.":[227],"Additionally,":[228],"it":[229],"achieves":[230],"6.1%":[232],"improvement":[233],"more":[236],"challenging":[237],"Union14M-L":[238],"dataset.":[239]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
