{"id":"https://openalex.org/W7137876972","doi":"https://doi.org/10.1609/aaai.v40i18.38582","title":"ImageBindDC: Compressing Multi-modal Data with ImageBind-based Condensation","display_name":"ImageBindDC: Compressing Multi-modal Data with ImageBind-based Condensation","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7137876972","doi":"https://doi.org/10.1609/aaai.v40i18.38582"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i18.38582","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i18.38582","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i18.38582","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129729439","display_name":"Yue Min","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yue Min","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129746191","display_name":"Shaobo Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shaobo Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129675738","display_name":"Jiaze Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiaze Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114097318","display_name":"Tianle Niu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tianle Niu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055093770","display_name":"Ji Fan","orcid":"https://orcid.org/0000-0001-5774-0059"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junxin Fan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yongliang Miao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yongliang Miao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006040497","display_name":"Lijin Yang","orcid":"https://orcid.org/0000-0003-3787-6658"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lijin Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129642313","display_name":"Linfeng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Linfeng Zhang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5129729439"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10761347,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"18","first_page":"15537","last_page":"15545"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.763700008392334,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.763700008392334,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.05770000070333481,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.0575999990105629,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5026000142097473},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.47530001401901245},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.41690000891685486},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4129999876022339},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.4108999967575073},{"id":"https://openalex.org/keywords/condensation","display_name":"Condensation","score":0.3831000030040741},{"id":"https://openalex.org/keywords/lossless-compression","display_name":"Lossless compression","score":0.3797999918460846},{"id":"https://openalex.org/keywords/statistical-model","display_name":"Statistical model","score":0.37139999866485596},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.3677999973297119},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.35499998927116394}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6011999845504761},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.550599992275238},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5026000142097473},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.47530001401901245},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.41690000891685486},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4129999876022339},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.4108999967575073},{"id":"https://openalex.org/C200093464","wikidata":"https://www.wikidata.org/wiki/Q166583","display_name":"Condensation","level":2,"score":0.3831000030040741},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.3797999918460846},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.37139999866485596},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.35499998927116394},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3467999994754791},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33320000767707825},{"id":"https://openalex.org/C18653775","wikidata":"https://www.wikidata.org/wiki/Q1333358","display_name":"Joint probability distribution","level":2,"score":0.3190999925136566},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.3179999887943268},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.30869999527931213},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.30239999294281006},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.30160000920295715},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.28439998626708984},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.28119999170303345},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.2757999897003174},{"id":"https://openalex.org/C179254644","wikidata":"https://www.wikidata.org/wiki/Q13222844","display_name":"Moment (physics)","level":2,"score":0.2743000090122223},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C123122884","wikidata":"https://www.wikidata.org/wiki/Q371730","display_name":"Well-defined","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2556999921798706},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.2526000142097473},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.25220000743865967},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2517000138759613},{"id":"https://openalex.org/C73586568","wikidata":"https://www.wikidata.org/wiki/Q2600211","display_name":"Parameter space","level":2,"score":0.2515999972820282},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i18.38582","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i18.38582","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i18.38582","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i18.38582","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Data":[0],"condensation":[1,46,207],"techniques":[2],"aim":[3],"to":[4,13,76,92,181],"synthesize":[5],"a":[6,10,43,64,78,167,189],"compact":[7],"dataset":[8],"from":[9],"larger":[11],"one":[12,182],"enable":[14],"efficient":[15],"model":[16,168],"training,":[17],"yet":[18],"while":[19],"successful":[20],"in":[21,27,72],"unimodal":[22],"settings,":[23],"they":[24],"often":[25],"fail":[26],"multimodal":[28],"scenarios":[29],"where":[30],"preserving":[31],"intricate":[32],"inter-modal":[33],"dependencies":[34],"is":[35],"crucial.":[36],"To":[37],"address":[38],"this,":[39],"we":[40],"introduce":[41],"ImageBindDC,":[42],"novel":[44],"data":[45,112,130,141,150],"framework":[47],"operating":[48],"within":[49,113],"the":[50,73,105,125,138,145,159,164,185,198],"unified":[51],"feature":[52],"space":[53],"of":[54,97,108,127,148,161],"ImageBind.":[55],"Our":[56],"approach":[57],"moves":[58],"beyond":[59],"conventional":[60],"distribution-matching":[61],"by":[62,123,143],"employing":[63],"powerful":[65],"Characteristic":[66],"Function":[67],"(CF)":[68],"loss,":[69],"which":[70,103,119,136],"operates":[71],"Fourier":[74],"domain":[75],"facilitate":[77],"more":[79,203],"precise":[80],"statistical":[81,106],"alignment":[82],"via":[83],"exact":[84],"infinite":[85],"moment":[86],"matching.":[87],"We":[88],"design":[89],"our":[90],"objective":[91],"enforce":[93],"three":[94],"critical":[95],"levels":[96],"distributional":[98],"consistency:":[99],"(i)":[100],"uni-modal":[101],"alignment,":[102,118,135],"matches":[104],"properties":[107],"synthetic":[109,154],"and":[110,132,202],"real":[111,149],"each":[114],"modality;":[115],"(ii)":[116],"cross-modal":[117],"preserves":[120],"pairwise":[121],"semantics":[122],"matching":[124],"distributions":[126],"hybrid":[128],"real-synthetic":[129],"pairs;":[131],"(iii)":[133],"joint-modal":[134],"captures":[137],"complete":[139],"multivariate":[140],"structure":[142],"aligning":[144],"joint":[146],"distribution":[147],"pairs":[151],"with":[152,192],"their":[153],"counterparts.":[155],"Extensive":[156],"experiments":[157],"highlight":[158],"effectiveness":[160],"ImageBindDC:":[162],"on":[163,170,184],"NYU-v2":[165],"dataset,":[166,187],"trained":[169,183],"just":[171],"5":[172],"condensed":[173],"datapoints":[174],"per":[175],"class":[176],"achieves":[177],"lossless":[178],"performance":[179],"comparable":[180],"full":[186],"achieving":[188],"new":[190],"state-of-the-art":[191],"an":[193],"8.2%":[194],"absolute":[195],"improvement":[196],"over":[197],"previous":[199],"best":[200],"method":[201],"than":[204],"4\u00d7":[205],"less":[206],"time.":[208]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2026-03-18T00:00:00"}
