{"id":"https://openalex.org/W4390730260","doi":"https://doi.org/10.1109/tcsvt.2024.3351601","title":"A Survey of Cross-Modal Visual Content Generation","display_name":"A Survey of Cross-Modal Visual Content Generation","publication_year":2024,"publication_date":"2024-01-09","ids":{"openalex":"https://openalex.org/W4390730260","doi":"https://doi.org/10.1109/tcsvt.2024.3351601"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3351601","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3351601","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068705264","display_name":"Fatemeh Nazarieh","orcid":"https://orcid.org/0000-0001-6917-6969"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Fatemeh Nazarieh","raw_affiliation_strings":["School of Computer Science and Electronic Engineering and the Nature Inspired Computing and Engineering (NICE) Research Group, University of Surrey, Guildford, U.K","School of Computer Science and Electronic Engineering, and the Nature Inspired Computing and Engineering (NICE) research group, University of Surrey, Guildford, UK"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Electronic Engineering and the Nature Inspired Computing and Engineering (NICE) Research Group, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]},{"raw_affiliation_string":"School of Computer Science and Electronic Engineering, and the Nature Inspired Computing and Engineering (NICE) research group, University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025299678","display_name":"Zhenhua Feng","orcid":"https://orcid.org/0000-0002-4485-4249"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhenhua Feng","raw_affiliation_strings":["School of Computer Science and Electronic Engineering and the Nature Inspired Computing and Engineering (NICE) Research Group, University of Surrey, Guildford, U.K","School of Computer Science and Electronic Engineering, and the Nature Inspired Computing and Engineering (NICE) research group, University of Surrey, Guildford, UK"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Electronic Engineering and the Nature Inspired Computing and Engineering (NICE) Research Group, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]},{"raw_affiliation_string":"School of Computer Science and Electronic Engineering, and the Nature Inspired Computing and Engineering (NICE) research group, University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100778579","display_name":"Muhammad Awais","orcid":"https://orcid.org/0000-0002-1122-0709"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Muhammad Awais","raw_affiliation_strings":["Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K"],"affiliations":[{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100676721","display_name":"Wenwu Wang","orcid":"https://orcid.org/0000-0002-8393-5703"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wenwu Wang","raw_affiliation_strings":["Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K"],"affiliations":[{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028209738","display_name":"Josef Kittler","orcid":"https://orcid.org/0000-0002-8110-9205"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Josef Kittler","raw_affiliation_strings":["Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K"],"affiliations":[{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5068705264"],"corresponding_institution_ids":["https://openalex.org/I28290843"],"apc_list":null,"apc_paid":null,"fwci":5.3818,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.96618529,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"34","issue":"8","first_page":"6814","last_page":"6832"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9129999876022339,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8054155707359314},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7678411602973938},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6252275705337524},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5544092059135437},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5533099174499512},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.44658544659614563},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4461211860179901},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.44550809264183044},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.4179582893848419},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.4149456322193146},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38204532861709595},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3564302921295166}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8054155707359314},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7678411602973938},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6252275705337524},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5544092059135437},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5533099174499512},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.44658544659614563},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4461211860179901},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.44550809264183044},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4179582893848419},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.4149456322193146},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38204532861709595},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3564302921295166},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcsvt.2024.3351601","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3351601","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},{"id":"pmh:oai:alma.44SUR_INST:11199610990002346","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4210197018","display_name":"View","issn_l":"2688-268X","issn":["2688-268X","2688-3988"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6868706350","display_name":"Multimodal Video Search by Examples (MVSE)","funder_award_id":"EP/V002856/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7111890331","display_name":null,"funder_award_id":"EP/V002856/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":172,"referenced_works":["https://openalex.org/W1797268635","https://openalex.org/W1861492603","https://openalex.org/W2007620009","https://openalex.org/W2015143272","https://openalex.org/W2026019603","https://openalex.org/W2030931454","https://openalex.org/W2062119563","https://openalex.org/W2065301447","https://openalex.org/W2075505763","https://openalex.org/W2080489767","https://openalex.org/W2098516422","https://openalex.org/W2099755684","https://openalex.org/W2108598243","https://openalex.org/W2119381621","https://openalex.org/W2133665775","https://openalex.org/W2151654057","https://openalex.org/W2163301185","https://openalex.org/W2232702494","https://openalex.org/W2249354239","https://openalex.org/W2466618734","https://openalex.org/W2474702929","https://openalex.org/W2551572271","https://openalex.org/W2556418146","https://openalex.org/W2594690981","https://openalex.org/W2620635248","https://openalex.org/W2738406145","https://openalex.org/W2741253951","https://openalex.org/W2752796333","https://openalex.org/W2782422271","https://openalex.org/W2808631503","https://openalex.org/W2883409523","https://openalex.org/W2897492344","https://openalex.org/W2901285216","https://openalex.org/W2902437806","https://openalex.org/W2912351236","https://openalex.org/W2962974533","https://openalex.org/W2963073614","https://openalex.org/W2963143316","https://openalex.org/W2963163163","https://openalex.org/W2963290645","https://openalex.org/W2963561004","https://openalex.org/W2963800363","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2971856312","https://openalex.org/W2973049979","https://openalex.org/W2978017171","https://openalex.org/W2979894294","https://openalex.org/W2982138396","https://openalex.org/W2982625143","https://openalex.org/W3007780968","https://openalex.org/W3009385801","https://openalex.org/W3019952993","https://openalex.org/W3023706973","https://openalex.org/W3068510429","https://openalex.org/W3081492798","https://openalex.org/W3085146247","https://openalex.org/W3092950464","https://openalex.org/W3099284785","https://openalex.org/W3100204393","https://openalex.org/W3100380967","https://openalex.org/W3101631197","https://openalex.org/W3109114891","https://openalex.org/W3118120400","https://openalex.org/W3125772723","https://openalex.org/W3145443213","https://openalex.org/W3153469116","https://openalex.org/W3153819643","https://openalex.org/W3153832461","https://openalex.org/W3158979919","https://openalex.org/W3173268697","https://openalex.org/W3176252609","https://openalex.org/W3176641147","https://openalex.org/W3177343422","https://openalex.org/W3185430283","https://openalex.org/W3196616669","https://openalex.org/W3196778134","https://openalex.org/W3197087768","https://openalex.org/W3197199219","https://openalex.org/W3204221554","https://openalex.org/W3209532394","https://openalex.org/W3212516020","https://openalex.org/W4214622647","https://openalex.org/W4221145616","https://openalex.org/W4224035735","https://openalex.org/W4225272741","https://openalex.org/W4226125322","https://openalex.org/W4281485151","https://openalex.org/W4281487277","https://openalex.org/W4281632497","https://openalex.org/W4281847696","https://openalex.org/W4286611314","https://openalex.org/W4288079574","https://openalex.org/W4288724078","https://openalex.org/W4289785095","https://openalex.org/W4297697565","https://openalex.org/W4297981470","https://openalex.org/W4298185919","https://openalex.org/W4303441850","https://openalex.org/W4311808636","https://openalex.org/W4312301053","https://openalex.org/W4312388283","https://openalex.org/W4312635677","https://openalex.org/W4312671789","https://openalex.org/W4312741694","https://openalex.org/W4312933868","https://openalex.org/W4313145975","https://openalex.org/W4313472219","https://openalex.org/W4315589026","https://openalex.org/W4317951215","https://openalex.org/W4319770604","https://openalex.org/W4320013936","https://openalex.org/W4320085220","https://openalex.org/W4323706279","https://openalex.org/W4327525621","https://openalex.org/W4327673614","https://openalex.org/W4377010269","https://openalex.org/W4378506819","https://openalex.org/W4385245566","https://openalex.org/W4385270985","https://openalex.org/W4386065402","https://openalex.org/W4386065807","https://openalex.org/W4386066462","https://openalex.org/W4386072096","https://openalex.org/W4386075487","https://openalex.org/W4386075819","https://openalex.org/W4386075888","https://openalex.org/W4386075993","https://openalex.org/W4386076001","https://openalex.org/W4386076250","https://openalex.org/W4386076405","https://openalex.org/W4386076617","https://openalex.org/W4389009369","https://openalex.org/W4390873382","https://openalex.org/W4393148714","https://openalex.org/W4394597549","https://openalex.org/W4402727926","https://openalex.org/W6683074461","https://openalex.org/W6718379498","https://openalex.org/W6735204497","https://openalex.org/W6737896281","https://openalex.org/W6748181857","https://openalex.org/W6756789066","https://openalex.org/W6765779288","https://openalex.org/W6768851824","https://openalex.org/W6776963518","https://openalex.org/W6779823529","https://openalex.org/W6781874425","https://openalex.org/W6783182287","https://openalex.org/W6790978476","https://openalex.org/W6791353385","https://openalex.org/W6793883596","https://openalex.org/W6796242362","https://openalex.org/W6802987763","https://openalex.org/W6809885388","https://openalex.org/W6810940779","https://openalex.org/W6811291704","https://openalex.org/W6838639034","https://openalex.org/W6838785959","https://openalex.org/W6838910450","https://openalex.org/W6838965156","https://openalex.org/W6841755765","https://openalex.org/W6844305113","https://openalex.org/W6846135447","https://openalex.org/W6849119191","https://openalex.org/W6849682310","https://openalex.org/W6849949366","https://openalex.org/W6850357939","https://openalex.org/W6850607732","https://openalex.org/W6850657078","https://openalex.org/W6853416641","https://openalex.org/W6853785652"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W4307407935","https://openalex.org/W649759291"],"abstract_inverted_index":{"Cross-modal":[0],"content":[1,27,55,97,111,157],"generation":[2,28,56,98],"has":[3,29],"become":[4],"very":[5],"popular":[6],"in":[7,42,53,116,138,183],"recent":[8,51],"years.":[9],"To":[10],"generate":[11],"high-quality":[12],"and":[13,35,66,93,135,145,167],"realistic":[14],"content,":[15],"a":[16,69,114,178],"variety":[17],"of":[18,50,105,164,170],"methods":[19],"have":[20],"been":[21],"proposed.":[22],"Among":[23],"these":[24],"approaches,":[25],"visual":[26,54,96,156],"attracted":[30],"significant":[31],"attention":[32],"from":[33,158],"academia":[34],"industry":[36],"due":[37],"to":[38,75],"its":[39],"vast":[40],"potential":[41],"various":[43],"applications.":[44],"This":[45,174],"survey":[46,175],"provides":[47],"an":[48,102],"overview":[49],"advances":[52],"conditioned":[57],"on":[58,71],"other":[59,159],"modalities,":[60,166],"such":[61,141],"as":[62,142,177],"text,":[63],"audio,":[64],"speech,":[65],"music,":[67],"with":[68,127],"focus":[70],"their":[72],"key":[73],"contributions":[74],"the":[76,82,106,117,128,133,139,162,168],"community.":[77],"In":[78],"addition,":[79],"we":[80,131,149],"summarize":[81],"existing":[83,118],"publicly":[84],"available":[85],"datasets":[86,107],"that":[87],"can":[88],"be":[89],"used":[90,108],"for":[91,109,154,180],"training":[92],"benchmarking":[94],"cross-modal":[95],"models.":[99],"We":[100],"provide":[101],"in-depth":[103],"exploration":[104,163],"audio-to-visual":[110],"generation,":[112],"filling":[113],"gap":[115],"literature.":[119],"Various":[120],"evaluation":[121],"metrics":[122],"are":[123],"also":[124],"introduced":[125],"along":[126],"datasets.":[129],"Furthermore,":[130],"discuss":[132],"challenges":[134],"limitations":[136],"encountered":[137],"area,":[140],"modality":[143],"alignment":[144],"semantic":[146],"coherence.":[147],"Last,":[148],"outline":[150],"possible":[151],"future":[152],"directions":[153],"synthesizing":[155],"modalities":[160],"including":[161],"new":[165],"development":[169],"multi-task":[171],"multi-modal":[172],"networks.":[173],"serves":[176],"resource":[179],"researchers":[181],"interested":[182],"quickly":[184],"gaining":[185],"insights":[186],"into":[187],"this":[188],"burgeoning":[189],"field.":[190]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
