{"id":"https://openalex.org/W7124441542","doi":"https://doi.org/10.1109/tmm.2026.3654379","title":"Heterogeneous Multimodal Federated Learning With Missing Modality via Mask-Restoration and Self-Guidance","display_name":"Heterogeneous Multimodal Federated Learning With Missing Modality via Mask-Restoration and Self-Guidance","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7124441542","doi":"https://doi.org/10.1109/tmm.2026.3654379"},"language":null,"primary_location":{"id":"doi:10.1109/tmm.2026.3654379","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2026.3654379","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123233838","display_name":"Zhibo Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090767","display_name":"Ministry of Education","ror":"https://ror.org/00b3tsf98","country_code":"RW","type":"government","lineage":["https://openalex.org/I4210090767"]}],"countries":["RW"],"is_corresponding":false,"raw_author_name":"Zhibo Cao","raw_affiliation_strings":["Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0008-4698-5470","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I4210090767"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075093436","display_name":"Kuangrong Hao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090767","display_name":"Ministry of Education","ror":"https://ror.org/00b3tsf98","country_code":"RW","type":"government","lineage":["https://openalex.org/I4210090767"]}],"countries":["RW"],"is_corresponding":false,"raw_author_name":"Kuangrong Hao","raw_affiliation_strings":["Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-9672-6161","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I4210090767"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123180928","display_name":"Lingguang Hao","orcid":null},"institutions":[{"id":"https://openalex.org/I9086337","display_name":"Taiyuan University of Technology","ror":"https://ror.org/03kv08d37","country_code":"CN","type":"education","lineage":["https://openalex.org/I9086337"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lingguang Hao","raw_affiliation_strings":["College of Electrical and Power Engineering, Taiyuan University of Technology, Taiyuan, China"],"raw_orcid":"https://orcid.org/0009-0003-8111-6143","affiliations":[{"raw_affiliation_string":"College of Electrical and Power Engineering, Taiyuan University of Technology, Taiyuan, China","institution_ids":["https://openalex.org/I9086337"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064572247","display_name":"Bing Wei","orcid":"https://orcid.org/0000-0002-2298-1474"},"institutions":[{"id":"https://openalex.org/I4210090767","display_name":"Ministry of Education","ror":"https://ror.org/00b3tsf98","country_code":"RW","type":"government","lineage":["https://openalex.org/I4210090767"]}],"countries":["RW"],"is_corresponding":false,"raw_author_name":"Bing Wei","raw_affiliation_strings":["Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I4210090767"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069677894","display_name":"Lihong Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090767","display_name":"Ministry of Education","ror":"https://ror.org/00b3tsf98","country_code":"RW","type":"government","lineage":["https://openalex.org/I4210090767"]}],"countries":["RW"],"is_corresponding":false,"raw_author_name":"Lihong Ren","raw_affiliation_strings":["Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0004-4451-5994","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Digitized Textile and Apparel Technology, Ministry of Education, School of Information and Intelligent Science, Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I4210090767"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07330412,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"3571","last_page":"3583"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.6190999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.6190999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.09040000289678574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.026900000870227814,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6812000274658203},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6707000136375427},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.6144000291824341},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5630000233650208},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4560999870300293},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.4189000129699707},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.4050999879837036},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3962000012397766}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8913999795913696},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6812000274658203},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6707000136375427},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.6144000291824341},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5654000043869019},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5630000233650208},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4578999876976013},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4560999870300293},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.4189000129699707},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.4050999879837036},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3962000012397766},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3898000121116638},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3671000003814697},{"id":"https://openalex.org/C2992525071","wikidata":"https://www.wikidata.org/wiki/Q50818671","display_name":"Federated learning","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3440000116825104},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.33469998836517334},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3127000033855438},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.28850001096725464},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.2703999876976013},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.265500009059906},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2583000063896179},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2026.3654379","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2026.3654379","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Federated":[0,104],"learning":[1,49],"(FL)":[2],"is":[3],"well-suited":[4],"for":[5,214],"multimodal":[6,47,68,103,185],"tasks":[7],"due":[8],"to":[9,12,40,71,117,127,152,169,188,192],"its":[10],"ability":[11],"protect":[13],"privacy":[14],"and":[15,66,108,156,204],"support":[16],"local":[17],"training.":[18],"However,":[19],"the":[20,82,88,125,143,150,171,184,194,197,208,211],"complexity":[21],"of":[22,58,84,131,174,196,210],"real-world":[23,95],"sensor":[24],"environments":[25],"causes":[26],"modality":[27,59,180,190],"heterogeneity":[28],"across":[29,178],"clients.":[30,69,181],"Some":[31],"modalities":[32],"may":[33,91],"be":[34,92],"missing":[35,77,119,132,157,216],"altogether,":[36],"making":[37],"it":[38],"difficult":[39],"construct":[41],"a":[42,100,114,164,175],"generalized":[43],"global":[44,176,198],"model.":[45,199],"Existing":[46],"federated":[48],"methods":[50],"often":[51],"address":[52],"modality-missing":[53],"scenarios":[54],"under":[55],"simplified":[56],"assumptions":[57],"heterogeneity,":[60],"typically":[61],"focusing":[62],"on":[63,202],"unimodal":[64],"clients":[65],"modality-complete":[67],"Moreover,":[70],"mitigate":[72],"performance":[73],"degradation":[74],"caused":[75],"by":[76],"modalities,":[78],"some":[79],"approaches":[80],"assume":[81],"availability":[83],"auxiliary":[85],"information":[86],"at":[87],"server,":[89],"which":[90],"impractical":[93],"in":[94],"scenarios.":[96],"Therefore,":[97],"we":[98,135,162],"propose":[99,163],"novel":[101],"heterogeneous":[102,179],"Learning":[105],"with":[106],"Mask-Restoration":[107,112],"Self-Guidance":[109],"(FL-MRSG).":[110],"The":[111],"employs":[113],"masking":[115],"strategy":[116,168],"simulate":[118],"data":[120,145,158],"during":[121],"feature":[122],"extraction,":[123],"enabling":[124,149],"network":[126,151],"learn":[128],"semantic":[129],"features":[130],"modality.":[133],"Furthermore,":[134],"introduce":[136],"an":[137],"innovative":[138],"self-guidance":[139],"mechanism":[140],"that":[141],"leverages":[142],"restored":[144],"as":[146],"guidance":[147],"information,":[148],"distinguish":[153],"between":[154],"complete":[155],"representations.":[159],"In":[160],"addition,":[161],"personalized":[165],"decoupled":[166],"aggregation":[167],"facilitate":[170],"collaborative":[172],"training":[173],"model":[177],"We":[182],"extend":[183],"test":[186],"set":[187],"arbitrary":[189,215],"combinations":[191],"evaluate":[193],"robustness":[195],"Extensive":[200],"experiments":[201],"MOSI":[203],"SIMS":[205],"datasets":[206],"demonstrate":[207],"effectiveness":[209],"proposed":[212],"FL-MRSG":[213],"modalities.":[217]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-01-17T00:00:00"}
