{"id":"https://openalex.org/W7138222100","doi":"https://doi.org/10.1609/aaai.v40i24.39093","title":"PROMISE: Prompt-Attentive Hierarchical Contrastive Learning for Robust Cross-Modal Representation with Missing Modalities","display_name":"PROMISE: Prompt-Attentive Hierarchical Contrastive Learning for Robust Cross-Modal Representation with Missing Modalities","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138222100","doi":"https://doi.org/10.1609/aaai.v40i24.39093"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i24.39093","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i24.39093","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/39093/43055","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/39093/43055","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129697871","display_name":"Jiajun Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiajun Chen","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110693484","display_name":"Sai Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sai Cheng","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023507742","display_name":"YUAN Li Min Yutao","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Yutao","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019656902","display_name":"Yirui Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"YiRui Zhang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002395365","display_name":"Haitao Yuan","orcid":"https://orcid.org/0000-0001-6721-065X"},"institutions":[{"id":"https://openalex.org/I128590013","display_name":"National Technological University","ror":"https://ror.org/04t730v47","country_code":"AR","type":"education","lineage":["https://openalex.org/I128590013"]},{"id":"https://openalex.org/I4210090124","display_name":"Tecnol\u00f3gico Nacional de M\u00e9xico","ror":"https://ror.org/00davry38","country_code":"MX","type":"government","lineage":["https://openalex.org/I1302736544","https://openalex.org/I4210090124","https://openalex.org/I4405258672"]}],"countries":["AR","MX"],"is_corresponding":false,"raw_author_name":"Haitao Yuan","raw_affiliation_strings":["National Technological University"],"affiliations":[{"raw_affiliation_string":"National Technological University","institution_ids":["https://openalex.org/I4210090124","https://openalex.org/I128590013"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129673195","display_name":"Peng Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Peng","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129703032","display_name":"Yi Zhong","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Zhong","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5129697871"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.45,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"24","first_page":"20076","last_page":"20082"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9593999981880188,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9593999981880188,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.009999999776482582,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.00430000014603138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7678999900817871},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5885999798774719},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.5455999970436096},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.5008000135421753},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.49470001459121704},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.489300012588501},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.4611000120639801}],"concepts":[{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7678999900817871},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7414000034332275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7211999893188477},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5885999798774719},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.5455999970436096},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.5008000135421753},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.49470001459121704},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.489300012588501},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.486299991607666},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.4611000120639801},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.4505000114440918},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.40209999680519104},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.37549999356269836},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3646000027656555},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.358599990606308},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.352400004863739},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i24.39093","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i24.39093","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/39093/43055","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i24.39093","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i24.39093","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/39093/43055","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138222100.pdf","grobid_xml":"https://content.openalex.org/works/W7138222100.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"models":[1],"integrating":[2],"natural":[3],"language":[4],"and":[5,41,123,141],"visual":[6],"information":[7],"have":[8],"substantially":[9],"improved":[10],"emotion":[11],"recognition":[12],"performance.":[13,68],"However,":[14],"their":[15],"effectiveness":[16],"significantly":[17],"declines":[18],"in":[19],"real-world":[20],"situations":[21],"where":[22,128],"certain":[23],"modalities":[24,50,130],"are":[25,131],"missing":[26,49,96],"or":[27],"unavailable.":[28],"This":[29,118],"degradation":[30],"primarily":[31],"stems":[32],"from":[33],"inconsistent":[34],"representation":[35,92],"learning":[36,104,109],"between":[37,139],"complete":[38,140],"multimodal":[39,77,102,166],"data":[40],"incomplete":[42,142],"modality":[43],"scenarios.":[44],"Existing":[45],"approaches":[46,58],"typically":[47],"address":[48],"through":[51],"relatively":[52],"simplistic":[53],"generation":[54],"methods,":[55],"yet":[56],"these":[57],"fail":[59],"to":[60,66,163],"adequately":[61],"preserve":[62],"cross-modal":[63,91],"consistency,":[64],"leading":[65],"suboptimal":[67],"To":[69],"overcome":[70],"this":[71],"limitation,":[72],"we":[73],"propose":[74],"a":[75,81,106,113],"novel":[76],"framework":[78],"named":[79],"PROMISE,":[80],"prompting-Attentive":[82],"Hierarchical":[83],"Contrastive":[84],"Learning":[85],"approach":[86],"designed":[87,115],"explicitly":[88],"for":[89,126],"robust":[90,122],"under":[93],"conditions":[94],"of":[95,160],"modalities.":[97],"Specifically,":[98],"Promise":[99],"innovatively":[100],"incorporates":[101],"prompt":[103],"into":[105],"hierarchical":[107],"contrastive":[108],"framework,":[110],"equipped":[111],"with":[112,151],"specially":[114],"prompting-attention":[116],"mechanism.":[117],"mechanism":[119],"dynamically":[120],"generates":[121],"consistent":[124],"representations":[125],"scenarios":[127],"particular":[129],"absent,":[132],"thereby":[133],"effectively":[134],"bridging":[135],"the":[136,157],"representational":[137],"gap":[138],"data.":[143],"Extensive":[144],"experiments":[145],"conducted":[146],"on":[147],"benchmark":[148],"datasets,":[149],"along":[150],"comprehensive":[152],"ablation":[153],"studies,":[154],"clearly":[155],"demonstrate":[156],"superior":[158],"performance":[159],"PROMISE":[161],"compared":[162],"current":[164],"state-of-the-art":[165],"methods.":[167]},"counts_by_year":[],"updated_date":"2026-03-20T20:47:17.329874","created_date":"2026-03-18T00:00:00"}
