{"id":"https://openalex.org/W7138266203","doi":"https://doi.org/10.1609/aaai.v40i11.37867","title":"CLUENet: Cluster Attention Makes Neural Networks Have Eyes","display_name":"CLUENet: Cluster Attention Makes Neural Networks Have Eyes","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138266203","doi":"https://doi.org/10.1609/aaai.v40i11.37867"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v40i11.37867","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i11.37867","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i11.37867","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129664140","display_name":"Xiangshuai Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiangshuai Song","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129656696","display_name":"Jun-Jie Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jun-Jie Huang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129728771","display_name":"Tianrui Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tianrui Liu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129700156","display_name":"Ke Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ke Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129697844","display_name":"Chang Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang Tang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41452991,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"11","first_page":"9106","last_page":"9115"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.2777999937534332,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.2777999937534332,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.17309999465942383,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.1476999968290329,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8881999850273132},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6173999905586243},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.588699996471405},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5703999996185303},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.454800009727478},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43479999899864197},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.414900004863739},{"id":"https://openalex.org/keywords/limit","display_name":"Limit (mathematics)","score":0.36230000853538513}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8881999850273132},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.796999990940094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7038999795913696},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6173999905586243},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.588699996471405},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5703999996185303},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.454800009727478},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43479999899864197},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.414900004863739},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3659000098705292},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.36230000853538513},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.36059999465942383},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.35899999737739563},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3434999883174896},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.3361000120639801},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3160000145435333},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.260699987411499},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2542000114917755}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1609/aaai.v40i11.37867","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i11.37867","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:ojs.aaai.org:article/37867","is_oa":false,"landing_page_url":"https://ojs.aaai.org/index.php/AAAI/article/view/37867","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2159-5399","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i11.37867","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i11.37867","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G284619639","display_name":null,"funder_award_id":"62522604","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G392162762","display_name":null,"funder_award_id":"62506371","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5084851867","display_name":null,"funder_award_id":"62201600","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5384871634","display_name":null,"funder_award_id":"62201604","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6330077812","display_name":null,"funder_award_id":"62476258","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"the":[1,65],"success":[2],"of":[3,153],"convolution-":[4],"and":[5,15,26,43,54,88,101,112,116,130,136,145,156],"attention-based":[6],"models":[7],"in":[8],"vision":[9],"tasks,":[10],"their":[11,19],"rigid":[12],"receptive":[13],"fields":[14],"complex":[16],"architectures":[17],"limit":[18],"ability":[20],"to":[21],"model":[22,36],"irregular":[23],"spatial":[24],"patterns":[25],"hinder":[27],"interpretability,":[28],"thereby":[29],"posing":[30],"challenges":[31],"for":[32,74,97,106],"tasks":[33],"requiring":[34],"high":[35],"transparency.":[37,157],"Clustering":[38],"paradigms":[39],"offer":[40],"promising":[41],"interpretability":[42],"flexible":[44],"semantic":[45,76],"modeling,":[46,109],"but":[47],"suffer":[48],"from":[49],"limited":[50],"accuracy,":[51,154],"low":[52],"efficiency,":[53,155],"gradient":[55],"vanishing":[56],"during":[57],"training.":[58],"To":[59],"address":[60],"these":[61],"issues,":[62],"we":[63,79],"propose":[64],"CLUster":[66],"attEntion":[67],"Network":[68],"(CLUENet),":[69],"a":[70,86,93,102,150],"transparent":[71],"deep":[72],"architecture":[73],"visual":[75,131,147],"understanding.":[77],"Specifically,":[78],"introduce":[80],"three":[81],"key":[82],"innovations,":[83],"including":[84],"(i)":[85],"Global":[87],"Soft":[89],"Feature":[90,114],"Aggregation":[91],"with":[92],"Temperature-Scaled":[94],"Cosine":[95],"Attention":[96],"capturing":[98],"long-range":[99],"dependencies":[100],"Gated":[103],"Fusion":[104],"Mechanism":[105],"enhanced":[107],"local":[108],"(ii)":[110],"Hard":[111],"Shared":[113],"Dispatching,":[115],"(iii)":[117],"an":[118],"Improved":[119],"Cluster":[120],"Pooling":[121],"Block.":[122],"These":[123],"enhancements":[124],"significantly":[125],"improve":[126],"both":[127],"classification":[128],"performance":[129],"interpretability.":[132],"Experiments":[133],"on":[134],"CIFAR-100":[135],"Mini-ImageNet":[137],"demonstrate":[138],"that":[139],"CLUENet":[140],"outperforms":[141],"existing":[142],"clustering":[143],"methods":[144],"mainstream":[146],"models,":[148],"offering":[149],"compelling":[151],"balance":[152]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-18T00:00:00"}
