{"id":"https://openalex.org/W4391709421","doi":"https://doi.org/10.48550/arxiv.2402.05294","title":"Examining Modality Incongruity in Multimodal Federated Learning for Medical Vision and Language-based Disease Detection","display_name":"Examining Modality Incongruity in Multimodal Federated Learning for Medical Vision and Language-based Disease Detection","publication_year":2024,"publication_date":"2024-02-07","ids":{"openalex":"https://openalex.org/W4391709421","doi":"https://doi.org/10.48550/arxiv.2402.05294"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.05294","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.05294","pdf_url":"https://arxiv.org/pdf/2402.05294","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.05294","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109583051","display_name":"Pramit Saha","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Saha, Pramit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045635805","display_name":"Divyanshu Mishra","orcid":"https://orcid.org/0000-0002-3264-8739"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mishra, Divyanshu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046908638","display_name":"F. Wagner","orcid":"https://orcid.org/0000-0001-5687-6392"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wagner, Felix","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001104721","display_name":"Konstantinos Kamnitsas","orcid":"https://orcid.org/0000-0003-3281-6509"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kamnitsas, Konstantinos","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077728082","display_name":"J. Alison Noble","orcid":"https://orcid.org/0000-0002-3060-3772"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Noble, J. Alison","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5109583051"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14222","display_name":"Knowledge Management and Technology","score":0.3540000021457672,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T14222","display_name":"Knowledge Management and Technology","score":0.3540000021457672,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.3070000112056732,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12734","display_name":"Information Systems and Technology Applications","score":0.29910001158714294,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.7534021139144897},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.575896680355072},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.5419908165931702},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.5015373229980469},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4129122495651245},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.09874376654624939}],"concepts":[{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.7534021139144897},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.575896680355072},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.5419908165931702},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.5015373229980469},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4129122495651245},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.09874376654624939}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2402.05294","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.05294","pdf_url":"https://arxiv.org/pdf/2402.05294","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2402.05294","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.05294","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.05294","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.05294","pdf_url":"https://arxiv.org/pdf/2402.05294","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3093803775","https://openalex.org/W3157841754","https://openalex.org/W4381827277","https://openalex.org/W2563212008","https://openalex.org/W4390136517","https://openalex.org/W3013953798","https://openalex.org/W2477990774","https://openalex.org/W3167558523","https://openalex.org/W3120825179","https://openalex.org/W2014028898"],"abstract_inverted_index":{"Multimodal":[0],"Federated":[1,15],"Learning":[2,16],"(MMFL)":[3],"utilizes":[4],"multiple":[5],"modalities":[6],"in":[7,29,102,113,120],"each":[8],"client":[9,116],"to":[10],"build":[11],"a":[12,107,114],"more":[13,74],"powerful":[14],"(FL)":[17],"model":[18],"than":[19,76],"its":[20,54,125],"unimodal":[21,69,77,121],"counterpart.":[22],"However,":[23],"the":[24,43,47,92,129,136],"impact":[25,48],"of":[26,49,85,94,138],"missing":[27,130],"modality":[28,34,50,108,118,131,146],"different":[30],"clients,":[31],"also":[32],"called":[33],"incongruity,":[35],"has":[36],"been":[37],"greatly":[38],"overlooked.":[39],"This":[40],"paper,":[41],"for":[42,117],"first":[44],"time,":[45],"analyses":[46],"incongruity":[51,147],"and":[52,70,123,140,163,168],"reveals":[53],"connection":[55],"with":[56,68,165],"data":[57],"heterogeneity":[58],"across":[59],"participating":[60],"clients.":[61],"We":[62],"particularly":[63],"inspect":[64],"whether":[65],"incongruent":[66],"MMFL":[67,154],"multimodal":[71,115],"clients":[72,122],"is":[73],"beneficial":[75],"FL.":[78],"Furthermore,":[79],"we":[80,90,105,134],"examine":[81],"three":[82],"potential":[83,126],"routes":[84],"addressing":[86],"this":[87],"issue.":[88],"Firstly,":[89],"study":[91],"effectiveness":[93],"various":[95],"self-attention":[96],"mechanisms":[97],"towards":[98,127,144],"incongruity-agnostic":[99],"information":[100],"fusion":[101],"MMFL.":[103],"Secondly,":[104],"introduce":[106],"imputation":[109],"network":[110],"(MIN)":[111],"pre-trained":[112],"translation":[119],"investigate":[124],"mitigating":[128,145],"problem.":[132],"Thirdly,":[133],"assess":[135],"capability":[137],"client-level":[139],"server-level":[141],"regularization":[142],"techniques":[143],"effects.":[148],"Experiments":[149],"are":[150],"conducted":[151],"under":[152],"several":[153],"settings":[155],"on":[156],"two":[157],"publicly":[158],"available":[159],"real-world":[160],"datasets,":[161],"MIMIC-CXR":[162],"Open-I,":[164],"Chest":[166],"X-Ray":[167],"radiology":[169],"reports.":[170]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2024-02-10T00:00:00"}
