{"id":"https://openalex.org/W4312412113","doi":"https://doi.org/10.1109/iscas48785.2022.9937519","title":"Anime Character Recognition using Intermediate Features Aggregation","display_name":"Anime Character Recognition using Intermediate Features Aggregation","publication_year":2022,"publication_date":"2022-05-28","ids":{"openalex":"https://openalex.org/W4312412113","doi":"https://doi.org/10.1109/iscas48785.2022.9937519"},"language":"en","primary_location":{"id":"doi:10.1109/iscas48785.2022.9937519","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas48785.2022.9937519","pdf_url":null,"source":{"id":"https://openalex.org/S4363604393","display_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087804607","display_name":"Edwin Arkel Rios","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Edwin Arkel Rios","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Hsinchu,Taiwan","National Yang Ming Chiao Tung University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Hsinchu,Taiwan","institution_ids":["https://openalex.org/I148366613"]},{"raw_affiliation_string":"National Yang Ming Chiao Tung University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029298215","display_name":"Min\u2010Chun Hu","orcid":"https://orcid.org/0000-0003-1917-2155"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Min-Chun Hu","raw_affiliation_strings":["National Tsing Hua University,Hsinchu,Taiwan","National Tsing Hua University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University,Hsinchu,Taiwan","institution_ids":["https://openalex.org/I25846049"]},{"raw_affiliation_string":"National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013913342","display_name":"Bo\u2010Cheng Lai","orcid":"https://orcid.org/0000-0002-9729-5196"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Bo-Cheng Lai","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Hsinchu,Taiwan","National Yang Ming Chiao Tung University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Hsinchu,Taiwan","institution_ids":["https://openalex.org/I148366613"]},{"raw_affiliation_string":"National Yang Ming Chiao Tung University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5087804607"],"corresponding_institution_ids":["https://openalex.org/I148366613"],"apc_list":null,"apc_paid":null,"fwci":0.4198,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.71217738,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"424","last_page":"428"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/anime","display_name":"Anime","score":0.8168004155158997},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8027533292770386},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5763382315635681},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5646743178367615},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.5056953430175781},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.5017039775848389},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.45414280891418457},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.4450942277908325},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.42278623580932617},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.373546838760376},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3503868579864502},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.0969996452331543},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.07973763346672058},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07898163795471191}],"concepts":[{"id":"https://openalex.org/C118130439","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Anime","level":2,"score":0.8168004155158997},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8027533292770386},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5763382315635681},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5646743178367615},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.5056953430175781},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.5017039775848389},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.45414280891418457},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.4450942277908325},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.42278623580932617},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.373546838760376},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3503868579864502},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0969996452331543},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.07973763346672058},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07898163795471191},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscas48785.2022.9937519","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas48785.2022.9937519","pdf_url":null,"source":{"id":"https://openalex.org/S4363604393","display_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309618","display_name":"Ministry of Science and Technology","ror":"https://ror.org/02b207r52"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1507108851","https://openalex.org/W1811750039","https://openalex.org/W2194775991","https://openalex.org/W2622263826","https://openalex.org/W2747543643","https://openalex.org/W2777662428","https://openalex.org/W2796108585","https://openalex.org/W2896457183","https://openalex.org/W2955425717","https://openalex.org/W2963649420","https://openalex.org/W2963784525","https://openalex.org/W2963959597","https://openalex.org/W2964280909","https://openalex.org/W3016895900","https://openalex.org/W3094502228","https://openalex.org/W3104636952","https://openalex.org/W3126792443","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3162926177","https://openalex.org/W3170874841","https://openalex.org/W4206706211","https://openalex.org/W4297736277","https://openalex.org/W4308831279","https://openalex.org/W4385245566","https://openalex.org/W6638214083","https://openalex.org/W6687483927","https://openalex.org/W6726983090","https://openalex.org/W6739622702","https://openalex.org/W6739901393","https://openalex.org/W6742838202","https://openalex.org/W6747381837","https://openalex.org/W6750964650","https://openalex.org/W6752574294","https://openalex.org/W6755207826","https://openalex.org/W6756444276","https://openalex.org/W6762718338","https://openalex.org/W6763509872","https://openalex.org/W6775930461","https://openalex.org/W6784333009","https://openalex.org/W6788135285","https://openalex.org/W6788556936","https://openalex.org/W6789753369","https://openalex.org/W6795288823"],"related_works":["https://openalex.org/W4241725891","https://openalex.org/W2075421999","https://openalex.org/W592941694","https://openalex.org/W2098776115","https://openalex.org/W4247978692","https://openalex.org/W4296571029","https://openalex.org/W2378422373","https://openalex.org/W3091774296","https://openalex.org/W4289597193","https://openalex.org/W2500902696"],"abstract_inverted_index":{"In":[0],"this":[1],"work":[2,19],"we":[3,119],"study":[4],"the":[5,37,52,71,124,139,142],"problem":[6],"of":[7,40,87,126,146],"anime":[8,77],"character":[9,78],"recognition.":[10,79],"Anime,":[11],"refers":[12],"to":[13,62,105],"animation":[14],"produced":[15],"within":[16],"Japan":[17],"and":[18,51,92,136],"derived":[20],"or":[21],"inspired":[22],"from":[23],"it.":[24],"We":[25,80,96],"propose":[26],"a":[27,85],"novel":[28],"Intermediate":[29],"Features":[30],"Aggregation":[31],"classification":[32,53,58,88],"head,":[33,54],"which":[34],"helps":[35],"smooth":[36],"optimization":[38],"landscape":[39],"Vision":[41],"Transformers":[42],"(ViTs)":[43],"by":[44,60],"adding":[45],"skip":[46],"connections":[47],"between":[48],"intermediate":[49],"layers":[50],"thereby":[55],"improving":[56],"relative":[57],"accuracy":[59],"up":[61],"28%.":[63],"The":[64],"proposed":[65],"model,":[66],"named":[67],"as":[68,130],"Animesion,":[69],"is":[70],"first":[72],"end-to-end":[73],"framework":[74],"for":[75,110],"large-scale":[76],"conduct":[81],"extensive":[82],"experiments":[83],"using":[84],"variety":[86],"models,":[89],"including":[90],"CNNs":[91],"self-attention":[93],"based":[94],"ViTs.":[95],"also":[97],"adapt":[98],"its":[99],"multimodal":[100,114],"variation":[101],"Vision-Language":[102],"Transformer":[103],"(ViLT),":[104],"incorporate":[106],"external":[107],"tag":[108],"data":[109],"classification,":[111],"without":[112],"additional":[113],"pre-training.":[115],"Through":[116],"our":[117],"results":[118],"obtain":[120],"new":[121],"insights":[122],"into":[123],"effects":[125],"how":[127],"hyperparameters":[128],"such":[129],"input":[131],"sequence":[132],"length,":[133],"mini-batch":[134],"size,":[135],"variations":[137],"on":[138],"architecture,":[140],"affect":[141],"transfer":[143],"learning":[144],"performance":[145],"Vi(L)Ts.":[147]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
