{"id":"https://openalex.org/W7131120742","doi":"https://doi.org/10.48550/arxiv.2602.18055","title":"Continual-NExT: A Unified Comprehension And Generation Continual Learning Framework","display_name":"Continual-NExT: A Unified Comprehension And Generation Continual Learning Framework","publication_year":2026,"publication_date":"2026-02-20","ids":{"openalex":"https://openalex.org/W7131120742","doi":"https://doi.org/10.48550/arxiv.2602.18055"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.18055","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048803696","display_name":"Jingyang Qiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Qiao, Jingyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126657707","display_name":"Zhizhong Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zhizhong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126584693","display_name":"Xin Tan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074868631","display_name":"Jingyu Gong","orcid":"https://orcid.org/0000-0002-4536-0953"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gong, Jingyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123729470","display_name":"Yanyun Qu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qu, Yanyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126585760","display_name":"Yuan Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Yuan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5048803696"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.6517000198364258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.6517000198364258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.10100000351667404,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.02500000037252903,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5900999903678894},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.5573999881744385},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5554999709129333},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4810999929904938},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.41659998893737793},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.37709999084472656},{"id":"https://openalex.org/keywords/lifelong-learning","display_name":"Lifelong learning","score":0.3693000078201294},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.366100013256073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.753600001335144},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5900999903678894},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.585099995136261},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.5573999881744385},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5554999709129333},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4810999929904938},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.41659998893737793},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.37709999084472656},{"id":"https://openalex.org/C108771440","wikidata":"https://www.wikidata.org/wiki/Q368475","display_name":"Lifelong learning","level":2,"score":0.3693000078201294},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.366100013256073},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3434999883174896},{"id":"https://openalex.org/C12298181","wikidata":"https://www.wikidata.org/wiki/Q7246814","display_name":"Proactive learning","level":5,"score":0.3165999948978424},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.30820000171661377},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.2736000120639801},{"id":"https://openalex.org/C2780735816","wikidata":"https://www.wikidata.org/wiki/Q28324931","display_name":"Incremental learning","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2563999891281128},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.25110000371932983}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.18055","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.18055","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.18055","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.18055","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4254097044467926,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Dual-to-Dual":[0,29,63,85,107,120],"MLLMs":[1,30,64,86,108],"refer":[2],"to":[3,41,137],"Multimodal":[4],"Large":[5],"Language":[6],"Models,":[7],"which":[8],"can":[9],"enable":[10],"unified":[11],"multimodal":[12],"comprehension":[13],"and":[14,18,26,72,128,133,144,157],"generation":[15],"through":[16],"text":[17],"image":[19],"modalities.":[20],"Although":[21],"exhibiting":[22],"strong":[23],"instantaneous":[24],"learning":[25,51,82,104,117,155],"generalization":[27],"capabilities,":[28],"still":[31],"remain":[32],"deficient":[33],"in":[34,74,96],"lifelong":[35],"evolution,":[36],"significantly":[37],"affecting":[38],"continual":[39,81,103,116,154],"adaptation":[40],"dynamic":[42],"real-world":[43],"scenarios.":[44],"One":[45],"of":[46,119,130],"the":[47,56,115],"challenges":[48,93],"is":[49],"that":[50,150],"new":[52],"tasks":[53],"inevitably":[54],"destroys":[55],"learned":[57],"knowledge.":[58],"Beyond":[59],"traditional":[60],"catastrophic":[61],"forgetting,":[62],"face":[65],"other":[66,153],"challenges,":[67],"including":[68],"hallucination,":[69],"instruction":[70],"unfollowing,":[71],"failures":[73],"cross-modal":[75],"knowledge":[76,140],"transfer.":[77],"However,":[78],"no":[79],"standardized":[80],"framework":[83,105],"for":[84,106],"has":[87],"been":[88],"established":[89],"yet,":[90],"leaving":[91],"these":[92],"unexplored.":[94],"Thus,":[95],"this":[97],"paper,":[98],"we":[99,122],"establish":[100],"Continual-NExT,":[101],"a":[102],"with":[109],"deliberately-architected":[110],"evaluation":[111],"metrics.":[112],"To":[113],"improve":[114],"capability":[118],"MLLMs,":[121],"propose":[123],"an":[124],"efficient":[125],"MAGE":[126,151],"(Mixture":[127],"Aggregation":[129],"General":[131],"LoRA":[132],"Expert":[134],"LoRA)":[135],"method":[136],"further":[138],"facilitate":[139],"transfer":[141],"across":[142],"modalities":[143],"mitigate":[145],"forgetting.":[146],"Extensive":[147],"experiments":[148],"demonstrate":[149],"outperforms":[152],"methods":[156],"achieves":[158],"state-of-the-art":[159],"performance.":[160]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-24T00:00:00"}
