{"id":"https://openalex.org/W7147384247","doi":"https://doi.org/10.1109/icvisp68610.2025.11451680","title":"Few-Shot Image Classification Algorithm Based on k-NN Attention Mechanism and Hierarchical Cascaded Transformer","display_name":"Few-Shot Image Classification Algorithm Based on k-NN Attention Mechanism and Hierarchical Cascaded Transformer","publication_year":2025,"publication_date":"2025-11-28","ids":{"openalex":"https://openalex.org/W7147384247","doi":"https://doi.org/10.1109/icvisp68610.2025.11451680"},"language":null,"primary_location":{"id":"doi:10.1109/icvisp68610.2025.11451680","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451680","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090372699","display_name":"Chaoqi Song","orcid":null},"institutions":[{"id":"https://openalex.org/I4210136859","display_name":"Xi\u2019an University of Posts and Telecommunications","ror":"https://ror.org/04jn0td46","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210136859"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chaoqi Song","raw_affiliation_strings":["Xi&#x2019;an University of Posts and Telecommunications,School of Communication and Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an University of Posts and Telecommunications,School of Communication and Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I4210136859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100430876","display_name":"Xi Zhang","orcid":"https://orcid.org/0000-0003-3415-5345"},"institutions":[{"id":"https://openalex.org/I4210136859","display_name":"Xi\u2019an University of Posts and Telecommunications","ror":"https://ror.org/04jn0td46","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210136859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Zhang","raw_affiliation_strings":["Xi&#x2019;an University of Posts and Telecommunications,School of Communication and Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an University of Posts and Telecommunications,School of Communication and Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I4210136859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132616606","display_name":"Yichen Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I119045251","display_name":"Huaqiao University","ror":"https://ror.org/03frdh605","country_code":"CN","type":"education","lineage":["https://openalex.org/I119045251"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yichen Wu","raw_affiliation_strings":["Huaqiao University,School of Computer Science and Technology,Xiamen,China"],"affiliations":[{"raw_affiliation_string":"Huaqiao University,School of Computer Science and Technology,Xiamen,China","institution_ids":["https://openalex.org/I119045251"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132691320","display_name":"Yu Hao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210136859","display_name":"Xi\u2019an University of Posts and Telecommunications","ror":"https://ror.org/04jn0td46","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210136859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Hao","raw_affiliation_strings":["Xi&#x2019;an University of Posts and Telecommunications,School of Communication and Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an University of Posts and Telecommunications,School of Communication and Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I4210136859"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102512772","display_name":"Jixiang Du","orcid":null},"institutions":[{"id":"https://openalex.org/I119045251","display_name":"Huaqiao University","ror":"https://ror.org/03frdh605","country_code":"CN","type":"education","lineage":["https://openalex.org/I119045251"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jixiang Du","raw_affiliation_strings":["Huaqiao University,School of Computer Science and Technology,Xiamen,China"],"affiliations":[{"raw_affiliation_string":"Huaqiao University,School of Computer Science and Technology,Xiamen,China","institution_ids":["https://openalex.org/I119045251"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5090372699"],"corresponding_institution_ids":["https://openalex.org/I4210136859"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.87527987,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.5126000046730042,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.5126000046730042,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.09309999644756317,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.07180000096559525,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.5983999967575073},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5625},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.5293999910354614},{"id":"https://openalex.org/keywords/separable-space","display_name":"Separable space","score":0.5166000127792358},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5112000107765198},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.48649999499320984},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4059999883174896},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.38769999146461487}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6848000288009644},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.5983999967575073},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5625},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5504000186920166},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.5293999910354614},{"id":"https://openalex.org/C70710897","wikidata":"https://www.wikidata.org/wiki/Q680081","display_name":"Separable space","level":2,"score":0.5166000127792358},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5112000107765198},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.48649999499320984},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.48579999804496765},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4059999883174896},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.38769999146461487},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.37599998712539673},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3643999993801117},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.3474000096321106},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3343000113964081},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.32839998602867126},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icvisp68610.2025.11451680","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451680","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W183625566","https://openalex.org/W1995341919","https://openalex.org/W2164383578","https://openalex.org/W2909384861","https://openalex.org/W2964105864","https://openalex.org/W3012255272","https://openalex.org/W3034312118","https://openalex.org/W3035524453","https://openalex.org/W3093147807","https://openalex.org/W3096805028","https://openalex.org/W3159481202","https://openalex.org/W3171007011","https://openalex.org/W3173788280","https://openalex.org/W3173908982","https://openalex.org/W3197005357","https://openalex.org/W3205249428","https://openalex.org/W4214562728","https://openalex.org/W4221141660","https://openalex.org/W4292133509","https://openalex.org/W4312282457","https://openalex.org/W4312430245","https://openalex.org/W4312589513","https://openalex.org/W4313166619","https://openalex.org/W4319300692","https://openalex.org/W4323338297","https://openalex.org/W4386076551","https://openalex.org/W4392507002","https://openalex.org/W4400486605","https://openalex.org/W4402510265","https://openalex.org/W4402768659","https://openalex.org/W4408326908","https://openalex.org/W4414989222","https://openalex.org/W7133228441","https://openalex.org/W7133261799"],"related_works":[],"abstract_inverted_index":{"To":[0],"tackle":[1],"the":[2,25,35,43,55,81,90,106,109,121,141,147,153,168],"issue":[3],"that":[4,101,167],"existing":[5],"models":[6],"lack":[7],"adequate":[8],"feature":[9,47,158],"extraction":[10,159],"capacity":[11],"in":[12,140,156,181],"few-shot":[13,182],"image":[14,183],"classification":[15,22],"scenarios,":[16],"this":[17],"paper":[18],"proposes":[19],"a":[20,60,66],"novel":[21],"algorithm":[23,44,170],"integrating":[24],"k-nearest":[26],"neighbor":[27],"attention":[28,57,92],"mechanism":[29,58,93],"and":[30,50,59,75,160],"hierarchical":[31,36,67,86],"cascaded":[32,37,68],"Transformer.":[33],"With":[34],"Transformer":[38],"as":[39],"its":[40,179],"basic":[41],"architecture,":[42],"significantly":[45],"improves":[46],"representation":[48],"capability":[49],"computational":[51,110],"efficiency":[52],"by":[53],"introducing":[54],"k-NN":[56],"depthwise":[61,135],"separable":[62,136],"convolution":[63,137],"module.":[64],"Firstly,":[65],"structure":[69],"is":[70,94,138],"adopted":[71],"to":[72,84,96,105,114],"progressively":[73],"extract":[74],"fuse":[76],"multi-scale":[77],"features,":[78],"which":[79,145],"enhances":[80],"model\u2019s":[82,122,154],"ability":[83],"perceive":[85],"semantic":[87],"information.":[88],"Secondly,":[89],"$\\mathbf{k}$-NN":[91],"utilized":[95],"dynamically":[97],"select":[98],"key-value":[99],"pairs":[100],"are":[102],"most":[103],"relevant":[104],"query,":[107],"reducing":[108],"complexity":[111],"from":[112],"$O\\left(N^{2}\\right)$":[113],"$O(k":[115],"N)$.":[116],"This":[117],"not":[118],"only":[119],"maintains":[120],"focus":[123],"on":[124],"key":[125],"regions":[126],"but":[127],"also":[128],"effectively":[129],"filters":[130],"out":[131],"noisy":[132],"tokens.":[133],"Finally,":[134],"embedded":[139],"feed-forward":[142],"network":[143],"(FFN),":[144],"reduces":[146],"number":[148],"of":[149],"parameters":[150],"while":[151],"enhancing":[152],"capabilities":[155],"local":[157],"long-range":[161],"dependency":[162],"modeling.":[163],"Experimental":[164],"results":[165],"show":[166],"proposed":[169],"achieves":[171],"leading":[172],"performance":[173],"compared":[174],"with":[175],"other":[176],"methods,":[177],"verifying":[178],"effectiveness":[180],"classification.":[184]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
