{"id":"https://openalex.org/W7153206356","doi":"https://doi.org/10.48550/arxiv.2604.07753","title":"Symbiotic-MoE: Unlocking the Synergy between Generation and Understanding","display_name":"Symbiotic-MoE: Unlocking the Synergy between Generation and Understanding","publication_year":2026,"publication_date":"2026-04-09","ids":{"openalex":"https://openalex.org/W7153206356","doi":"https://doi.org/10.48550/arxiv.2604.07753"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07753","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07753","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07753","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064432806","display_name":"Xiangyue Liu","orcid":"https://orcid.org/0000-0003-4463-8068"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Liu, Xiangyue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133392618","display_name":"Zijian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zijian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133389133","display_name":"Miles Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Miles","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133356329","display_name":"Zhao Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Zhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133328815","display_name":"Liefeng Bo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bo, Liefeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133319354","display_name":"Ping Tan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Ping","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5064432806"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.5604000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.5604000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.34619998931884766,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.019300000742077827,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.7146000266075134},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.4424999952316284},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4147000014781952},{"id":"https://openalex.org/keywords/constructive","display_name":"Constructive","score":0.39309999346733093},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.373199999332428},{"id":"https://openalex.org/keywords/generative-design","display_name":"Generative Design","score":0.3610999882221222}],"concepts":[{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.7146000266075134},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6973000168800354},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5576000213623047},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.4424999952316284},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43799999356269836},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4147000014781952},{"id":"https://openalex.org/C2778701210","wikidata":"https://www.wikidata.org/wiki/Q28130034","display_name":"Constructive","level":3,"score":0.39309999346733093},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.373199999332428},{"id":"https://openalex.org/C184408114","wikidata":"https://www.wikidata.org/wiki/Q1502022","display_name":"Generative Design","level":3,"score":0.3610999882221222},{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.3601999878883362},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.3531000018119812},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3321000039577484},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3107999861240387},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.2660999894142151}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07753","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07753","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07753","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07753","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Empowering":[0],"Large":[1],"Multimodal":[2],"Models":[3],"(LMMs)":[4],"with":[5,65,179],"image":[6],"generation":[7],"often":[8],"leads":[9,75],"to":[10,17,76,114,122],"catastrophic":[11],"forgetting":[12],"in":[13],"understanding":[14,178],"tasks":[15,121],"due":[16],"severe":[18],"gradient":[19,141],"conflicts.":[20],"While":[21],"existing":[22],"paradigms":[23],"like":[24],"Mixture-of-Transformers":[25],"(MoT)":[26],"mitigate":[27],"this":[28,44,109],"conflict":[29],"through":[30],"structural":[31],"isolation,":[32],"they":[33],"fundamentally":[34],"sever":[35],"cross-modal":[36,174],"synergy":[37],"and":[38,139,184],"suffer":[39],"from":[40,119,150],"capacity":[41],"fragmentation.":[42],"In":[43],"work,":[45],"we":[46,88,129],"present":[47],"Symbiotic-MoE,":[48],"a":[49,58,104,131],"unified":[50],"pre-training":[51],"framework":[52],"that":[53,71,166],"resolves":[54],"task":[55],"interference":[56],"within":[57],"native":[59],"multimodal":[60,105],"Mixture-of-Experts":[61],"(MoE)":[62],"Transformers":[63],"architecture":[64],"zero-parameter":[66],"overhead.":[67],"We":[68],"first":[69],"identify":[70],"standard":[72],"MoE":[73],"tuning":[74],"routing":[77],"collapse,":[78],"where":[79],"generative":[80,120,156,170],"gradients":[81],"dominate":[82],"expert":[83],"utilization.":[84],"To":[85,126],"address":[86],"this,":[87,128],"introduce":[89],"Modality-Aware":[90],"Expert":[91],"Disentanglement,":[92],"which":[93],"partitions":[94],"experts":[95,102,113],"into":[96,158],"task-specific":[97],"groups":[98],"while":[99,172],"utilizing":[100],"shared":[101,112],"as":[103],"semantic":[106],"bridge.":[107],"Crucially,":[108],"design":[110],"allows":[111],"absorb":[115],"fine-grained":[116],"visual":[117],"semantics":[118],"enrich":[123],"textual":[124],"representations.":[125],"optimize":[127],"propose":[130],"Progressive":[132],"Training":[133],"Strategy":[134],"featuring":[135],"differential":[136],"learning":[137],"rates":[138],"early-stage":[140],"shielding.":[142],"This":[143],"mechanism":[144],"not":[145],"only":[146],"shields":[147],"pre-trained":[148],"knowledge":[149],"early":[151],"volatility":[152],"but":[153],"eventually":[154],"transforms":[155],"signals":[157],"constructive":[159],"feedback":[160],"for":[161],"understanding.":[162],"Extensive":[163],"experiments":[164],"demonstrate":[165],"Symbiotic-MoE":[167],"achieves":[168],"rapid":[169],"convergence":[171],"unlocking":[173],"synergy,":[175],"boosting":[176],"inherent":[177],"remarkable":[180],"gains":[181],"on":[182],"MMLU":[183],"OCRBench.":[185]},"counts_by_year":[],"updated_date":"2026-04-11T06:19:08.300824","created_date":"2026-04-11T00:00:00"}
