{"id":"https://openalex.org/W7154412806","doi":"https://doi.org/10.48550/arxiv.2604.10666","title":"Omnimodal Dataset Distillation via High-order Proxy Alignment","display_name":"Omnimodal Dataset Distillation via High-order Proxy Alignment","publication_year":2026,"publication_date":"2026-04-12","ids":{"openalex":"https://openalex.org/W7154412806","doi":"https://doi.org/10.48550/arxiv.2604.10666"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.10666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.10666","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133626390","display_name":"Yuxuan Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gao, Yuxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133620277","display_name":"Xiaohao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaohao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133553898","display_name":"Xiaobo Xia","orcid":"https://orcid.org/0000-0003-1720-7860"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xia, Xiaobo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133610523","display_name":"Tongliang Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Tongliang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5133626390"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6873999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6873999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.14149999618530273,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.039900001138448715,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.8119000196456909},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6535000205039978},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.6485000252723694},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5722000002861023},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.4138000011444092},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.39890000224113464},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3781999945640564},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.373199999332428},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.34850001335144043}],"concepts":[{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.8119000196456909},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.723800003528595},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6535000205039978},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.6485000252723694},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6134999990463257},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5722000002861023},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.4138000011444092},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4002000093460083},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.39890000224113464},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3781999945640564},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.373199999332428},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.34850001335144043},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.3465000092983246},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3353999853134155},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.3296999931335449},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3262999951839447},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.3138999938964844},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.31279999017715454},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2567000091075897},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.25440001487731934},{"id":"https://openalex.org/C111696304","wikidata":"https://www.wikidata.org/wiki/Q2303697","display_name":"Sorting","level":2,"score":0.2515999972820282},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.25099998712539673},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.10666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.10666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.4439373314380646,"id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Dataset":[0,36],"distillation":[1,26,125,145],"compresses":[2],"large-scale":[3],"datasets":[4],"into":[5],"compact":[6,92],"synthetic":[7],"sets":[8],"while":[9],"preserving":[10],"training":[11],"performance,":[12],"but":[13],"existing":[14,163],"methods":[15],"are":[16],"largely":[17],"restricted":[18],"to":[19,27,43,162],"single-modal":[20],"or":[21],"bimodal":[22,143],"settings.":[23],"Extending":[24],"dataset":[25,144],"scenarios":[28],"involving":[29],"more":[30],"than":[31],"two":[32],"modalities,":[33],"i.e.,":[34],"Omnimodal":[35],"Distillation,":[37],"remains":[38],"underexplored":[39],"and":[40,46,121],"challenging":[41],"due":[42],"increased":[44],"heterogeneity":[45],"complex":[47],"cross-modal":[48,88],"interactions.":[49],"In":[50],"this":[51,77],"work,":[52],"we":[53,79],"identify":[54],"the":[55,60,64,114,132,136,154],"key":[56],"determinant":[57],"that":[58,85,153],"bounds":[59],"endpoint":[61],"discrepancy":[62],"in":[63],"omnimodal":[65,104],"setting,":[66],"which":[67,94],"is":[68,95],"exacerbated":[69],"with":[70,97,106],"an":[71],"increasing":[72],"number":[73],"of":[74,117,138],"modalities.":[75,128],"To":[76],"end,":[78],"propose":[80],"HoPA,":[81],"a":[82,91,107],"unified":[83],"method":[84,112,141,156],"captures":[86],"high-order":[87],"alignments":[89],"via":[90],"proxy,":[93],"compatible":[96],"trajectory":[98],"matching":[99],"as":[100],"well.":[101],"By":[102],"abstracting":[103],"alignment":[105],"shared":[108],"similarity":[109],"structure,":[110],"our":[111,139],"avoids":[113],"combinatorial":[115],"complexity":[116],"pairwise":[118],"modality":[119],"modeling":[120],"enables":[122],"scalable":[123],"joint":[124],"across":[126],"heterogeneous":[127],"Theoretical":[129],"analysis":[130],"from":[131],"spectral":[133],"perspective":[134],"reveals":[135],"rationality":[137],"proposed":[140,155],"against":[142],"techniques.":[146],"Extensive":[147],"experiments":[148],"on":[149],"various":[150],"benchmarks":[151],"demonstrate":[152],"achieves":[157],"superior":[158],"compression-performance":[159],"trade-offs":[160],"compared":[161],"competitors.":[164],"The":[165],"source":[166],"code":[167],"will":[168],"be":[169],"publicly":[170],"released.":[171]},"counts_by_year":[],"updated_date":"2026-04-15T06:04:33.058270","created_date":"2026-04-15T00:00:00"}
