{"id":"https://openalex.org/W4220863108","doi":"https://doi.org/10.1587/transinf.2021edp7166","title":"Recursive Multi-Scale Channel-Spatial Attention for Fine-Grained Image Classification","display_name":"Recursive Multi-Scale Channel-Spatial Attention for Fine-Grained Image Classification","publication_year":2022,"publication_date":"2022-02-28","ids":{"openalex":"https://openalex.org/W4220863108","doi":"https://doi.org/10.1587/transinf.2021edp7166"},"language":"en","primary_location":{"id":"doi:10.1587/transinf.2021edp7166","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2021edp7166","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E105.D/3/E105.D_2021EDP7166/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/transinf/E105.D/3/E105.D_2021EDP7166/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037611716","display_name":"Dichao LIU","orcid":null},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Dichao LIU","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University","institution_ids":["https://openalex.org/I60134161"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100445098","display_name":"Yu Wang","orcid":"https://orcid.org/0000-0001-7959-3387"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yu WANG","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111458376","display_name":"Kenji Mase","orcid":null},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kenji MASE","raw_affiliation_strings":["Graduate School of Informatics, Nagoya University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Nagoya University","institution_ids":["https://openalex.org/I60134161"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080180020","display_name":"Jien Kato","orcid":"https://orcid.org/0000-0002-0196-4405"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jien KATO","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University","institution_ids":["https://openalex.org/I135768898"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5037611716"],"corresponding_institution_ids":["https://openalex.org/I60134161"],"apc_list":null,"apc_paid":null,"fwci":1.5092,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.83281774,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"E105.D","issue":"3","first_page":"713","last_page":"726"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8729187250137329},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8620778322219849},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6493391394615173},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5969894528388977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5949597358703613},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.5725171566009521},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5611091256141663},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5582037568092346},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.5122148394584656},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5090591311454773},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.48565709590911865},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.46519243717193604},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.4159199595451355},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33062589168548584},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.06210163235664368}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8729187250137329},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8620778322219849},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6493391394615173},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5969894528388977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5949597358703613},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.5725171566009521},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5611091256141663},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5582037568092346},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.5122148394584656},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5090591311454773},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.48565709590911865},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.46519243717193604},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.4159199595451355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33062589168548584},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.06210163235664368},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transinf.2021edp7166","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2021edp7166","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E105.D/3/E105.D_2021EDP7166/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transinf.2021edp7166","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2021edp7166","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E105.D/3/E105.D_2021EDP7166/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.75,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4220863108.pdf","grobid_xml":"https://content.openalex.org/works/W4220863108.grobid-xml"},"referenced_works_count":51,"referenced_works":["https://openalex.org/W56385144","https://openalex.org/W1496650988","https://openalex.org/W1596562677","https://openalex.org/W1686810756","https://openalex.org/W1836465849","https://openalex.org/W1849277567","https://openalex.org/W1928906481","https://openalex.org/W1955942245","https://openalex.org/W1980526845","https://openalex.org/W2039507552","https://openalex.org/W2064675550","https://openalex.org/W2097117768","https://openalex.org/W2108598243","https://openalex.org/W2110015572","https://openalex.org/W2125283600","https://openalex.org/W2138011018","https://openalex.org/W2194775991","https://openalex.org/W2202499615","https://openalex.org/W2289708887","https://openalex.org/W2462457117","https://openalex.org/W2479109623","https://openalex.org/W2518108298","https://openalex.org/W2579318141","https://openalex.org/W2737725206","https://openalex.org/W2752782242","https://openalex.org/W2761785940","https://openalex.org/W2765268259","https://openalex.org/W2884585870","https://openalex.org/W2891951760","https://openalex.org/W2895340641","https://openalex.org/W2895361760","https://openalex.org/W2899771611","https://openalex.org/W2908347420","https://openalex.org/W2963150697","https://openalex.org/W2963393555","https://openalex.org/W2963407932","https://openalex.org/W2963855133","https://openalex.org/W3003792425","https://openalex.org/W3005359536","https://openalex.org/W3035367622","https://openalex.org/W3094502228","https://openalex.org/W3094897602","https://openalex.org/W3101590291","https://openalex.org/W3108870912","https://openalex.org/W3123272955","https://openalex.org/W3128999341","https://openalex.org/W3139434170","https://openalex.org/W3172917901","https://openalex.org/W3174336354","https://openalex.org/W3176285518","https://openalex.org/W4206192903"],"related_works":["https://openalex.org/W2952813363","https://openalex.org/W2911497689","https://openalex.org/W4360783045","https://openalex.org/W2129933262","https://openalex.org/W2963346891","https://openalex.org/W2770149305","https://openalex.org/W2972076240","https://openalex.org/W3167930666","https://openalex.org/W3014952856","https://openalex.org/W2964843961"],"abstract_inverted_index":{"Fine-grained":[0],"image":[1,70,152,163],"classification":[2,133],"is":[3,40,81,155,166],"a":[4,91,115],"difficult":[5],"problem,":[6],"and":[7,22,39,102,135,154],"previous":[8,66],"studies":[9],"mainly":[10],"overcome":[11],"this":[12,47,60,111],"problem":[13],"by":[14,83],"locating":[15,33],"multiple":[16],"discriminative":[17,34],"regions":[18,35],"in":[19,150],"different":[20],"scales":[21],"then":[23],"aggregating":[24],"complementary":[25,156],"information":[26,80],"explored":[27,82],"from":[28],"the":[29,51,63,78,86,132],"located":[30],"regions.":[31,109],"However,":[32,77],"introduces":[36],"heavy":[37],"overhead":[38],"not":[41],"suitable":[42],"for":[43,58,161],"real-world":[44],"application.":[45],"In":[46,110],"paper,":[48],"we":[49],"propose":[50],"recursive":[52],"multi-scale":[53,74,100],"channel-spatial":[54],"attention":[55,108,136,148],"module":[56,117],"(RMCSAM)":[57],"addressing":[59],"problem.":[61],"Following":[62],"experience":[64],"of":[65,90,106],"research":[67],"on":[68],"fine-grained":[69,151,162],"classification,":[71,153],"RMCSAM":[72,113,129,142],"explores":[73],"attentional":[75,79],"information.":[76],"recursively":[84],"refining":[85],"deep":[87],"feature":[88],"maps":[89],"convolutional":[92],"neural":[93],"network":[94],"(CNN)":[95],"to":[96,99,157],"better":[97,144],"correspond":[98],"channel-wise":[101],"spatial-wise":[103],"attention,":[104],"instead":[105],"localizing":[107],"way,":[112],"provides":[114],"lightweight":[116],"that":[118,128],"can":[119,130],"be":[120],"inserted":[121],"into":[122],"standard":[123],"CNNs.":[124],"Experimental":[125],"results":[126],"show":[127],"improve":[131],"accuracy":[134],"capturing":[137],"ability":[138],"over":[139],"baselines.":[140],"Also,":[141],"performs":[143],"than":[145],"other":[146],"state-of-the-art":[147,159],"modules":[149],"some":[158],"approaches":[160],"classification.":[164],"Code":[165],"available":[167],"at":[168],"https://github.com/Dichao-Liu/Recursive-Multi-Scale-Channel-Spatial-Attention-Module.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
