{"id":"https://openalex.org/W7138081668","doi":"https://doi.org/10.1609/aaai.v40i9.37635","title":"Frequency-Aligned Cross-Modal Learning with Top-K Wavelet Fusion and Dynamic Expert Routing for Enhanced Retinal Disease Diagnosis","display_name":"Frequency-Aligned Cross-Modal Learning with Top-K Wavelet Fusion and Dynamic Expert Routing for Enhanced Retinal Disease Diagnosis","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138081668","doi":"https://doi.org/10.1609/aaai.v40i9.37635"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v40i9.37635","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i9.37635","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37635/41597","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37635/41597","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071481265","display_name":"Yuxin Lin","orcid":"https://orcid.org/0000-0002-3375-1383"},"institutions":[{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuxin Lin","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen\nShenzhen Key Laboratory of Visual Object Detection and Recognition"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen\nShenzhen Key Laboratory of Visual Object Detection and Recognition","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I158809036"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129733460","display_name":"Haoran Li","orcid":null},"institutions":[{"id":"https://openalex.org/I204824540","display_name":"University of Wollongong","ror":"https://ror.org/00jtmb277","country_code":"AU","type":"education","lineage":["https://openalex.org/I204824540"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Haoran Li","raw_affiliation_strings":["School of Information Technology, University of Wollongong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Information Technology, University of Wollongong","institution_ids":["https://openalex.org/I204824540"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129699042","display_name":"Haoyu Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyu Cao","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067821096","display_name":"Yongting Hu","orcid":"https://orcid.org/0000-0003-3924-3547"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongting Hu","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102635057","display_name":"QiHao Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qihao Xu","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129657907","display_name":"Chengliang Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]},{"id":"https://openalex.org/I4210164862","display_name":"Artificial Intelligence in Medicine (Canada)","ror":"https://ror.org/05p590m36","country_code":"CA","type":"company","lineage":["https://openalex.org/I4210164862"]}],"countries":["CA","HK"],"is_corresponding":false,"raw_author_name":"Chengliang Liu","raw_affiliation_strings":["Laboratory for Artificial Intelligence in Design, The Hong Kong Polytechnic University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratory for Artificial Intelligence in Design, The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506","https://openalex.org/I4210164862"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129730191","display_name":"Xiaoling Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoling Luo","raw_affiliation_strings":["College of Computer Science and Software Engineering, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129641085","display_name":"Zhihao Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhihao Wu","raw_affiliation_strings":["School of Artificial Intelligence, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Shenzhen University","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129658132","display_name":"Yong Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Xu","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen\nShenzhen Key Laboratory of Visual Object Detection and Recognition"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen\nShenzhen Key Laboratory of Visual Object Detection and Recognition","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I158809036"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129667449","display_name":"Wei Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5071481265"],"corresponding_institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28125,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"9","first_page":"7006","last_page":"7014"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11438","display_name":"Retinal Imaging and Analysis","score":0.8921999931335449,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11438","display_name":"Retinal Imaging and Analysis","score":0.8921999931335449,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10170","display_name":"Retinal Diseases and Treatments","score":0.02459999918937683,"subfield":{"id":"https://openalex.org/subfields/2731","display_name":"Ophthalmology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12599","display_name":"Retinal and Optic Conditions","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/2731","display_name":"Ophthalmology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6359999775886536},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.498199999332428},{"id":"https://openalex.org/keywords/concatenation","display_name":"Concatenation (mathematics)","score":0.4936000108718872},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4918000102043152},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.48100000619888306},{"id":"https://openalex.org/keywords/wavelet","display_name":"Wavelet","score":0.4794999957084656},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.4487000107765198}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7337999939918518},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7127000093460083},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6359999775886536},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.498199999332428},{"id":"https://openalex.org/C87619178","wikidata":"https://www.wikidata.org/wiki/Q126002","display_name":"Concatenation (mathematics)","level":2,"score":0.4936000108718872},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4918000102043152},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.48100000619888306},{"id":"https://openalex.org/C47432892","wikidata":"https://www.wikidata.org/wiki/Q831390","display_name":"Wavelet","level":2,"score":0.4794999957084656},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.4487000107765198},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4302999973297119},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.40470001101493835},{"id":"https://openalex.org/C196216189","wikidata":"https://www.wikidata.org/wiki/Q2867","display_name":"Wavelet transform","level":3,"score":0.352400004863739},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3492000102996826},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.30169999599456787},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C46286280","wikidata":"https://www.wikidata.org/wiki/Q2414958","display_name":"Discrete wavelet transform","level":4,"score":0.259799987077713}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1609/aaai.v40i9.37635","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i9.37635","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37635/41597","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:ojs.aaai.org:article/37635","is_oa":false,"landing_page_url":"https://ojs.aaai.org/index.php/AAAI/article/view/37635","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2159-5399","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i9.37635","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i9.37635","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37635/41597","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.6418811082839966,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G620410641","display_name":null,"funder_award_id":"62102339","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138081668.pdf","grobid_xml":"https://content.openalex.org/works/W7138081668.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"fusion":[1,28,57,185],"of":[2,46],"color":[3],"fundus":[4],"photography":[5],"(CFP)":[6],"and":[7,62,110,129,194],"optical":[8],"coherence":[9],"tomography":[10],"(OCT)":[11],"B-scan":[12],"images":[13],"has":[14],"demonstrated":[15],"superior":[16],"diagnostic":[17],"potential":[18],"for":[19,66],"retinal":[20,174],"diseases":[21],"compared":[22],"to":[23,108,123,138,161],"single-modality":[24],"approaches.":[25],"However,":[26],"existing":[27,184],"paradigms":[29],"-":[30,38],"whether":[31],"through":[32],"naive":[33],"concatenation":[34],"or":[35],"attention":[36,133],"mechanisms":[37],"treat":[39],"cross-modal":[40],"interactions":[41],"indiscriminately,":[42],"lacking":[43],"adaptive":[44,56],"modulation":[45],"modality-specific":[47],"contributions":[48],"under":[49],"varying":[50],"clinical":[51],"scenarios.":[52],"We":[53],"propose":[54],"an":[55],"framework":[58,71],"that":[59,177],"dynamically":[60],"routes":[61],"refines":[63],"multimodal":[64,173],"signals":[65],"enhancing":[67],"disease":[68,191],"recognition.":[69],"The":[70],"comprises":[72],"two":[73,172],"key":[74],"components:":[75],"1)":[76],"Dynamic":[77],"Cross-Modal":[78],"Expert":[79],"Routing":[80],"(CMER),":[81],"which":[82,117],"selectively":[83],"activates":[84],"convolutional":[85],"neural":[86],"network":[87],"(CNN)":[88],"experts":[89],"from":[90,97],"one":[91],"modality":[92,164],"based":[93],"on":[94,171],"contextual":[95],"guidance":[96],"the":[98,102,153],"other,":[99],"ensuring":[100],"only":[101],"most":[103],"relevant":[104],"feature":[105],"extractors":[106],"contribute":[107],"fusion;":[109],"2)":[111],"Top-K":[112],"Expert-Guided":[113],"Wavelet":[114],"Fusion":[115],"(TEWF),":[116],"performs":[118],"discrete":[119],"wavelet":[120],"transform":[121],"(DWT)":[122],"decompose":[124],"selected":[125],"features":[126],"into":[127],"low-":[128],"high-frequency":[130,139],"subbands.":[131],"Cross-modal":[132],"is":[134],"then":[135],"applied":[136],"specifically":[137],"components,":[140],"where":[141],"lesion-specific":[142],"microstructures":[143],"reside,":[144],"enabling":[145],"frequency-aware":[146],"fusion.":[147],"Finally,":[148],"inverse":[149],"DWT":[150],"(IDWT)":[151],"reconstructs":[152],"fused":[154],"representation,":[155],"weighted":[156],"by":[157,187],"CMER-derived":[158],"importance":[159],"scores":[160],"amplify":[162],"informative":[163],"cues":[165],"while":[166],"suppressing":[167],"redundancy.":[168],"Experimental":[169],"validation":[170],"datasets":[175],"demonstrates":[176],"our":[178],"method":[179],"achieves":[180],"state-of-the-art":[181],"performance,":[182],"outperforming":[183],"strategies":[186],"significant":[188],"margins":[189],"in":[190],"classification":[192],"accuracy":[193],"robustness.":[195]},"counts_by_year":[],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2026-03-18T00:00:00"}
