{"id":"https://openalex.org/W7133349437","doi":"https://doi.org/10.48550/arxiv.2603.01068","title":"LLaDA-o: An Effective and Length-Adaptive Omni Diffusion Model","display_name":"LLaDA-o: An Effective and Length-Adaptive Omni Diffusion Model","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133349437","doi":"https://doi.org/10.48550/arxiv.2603.01068"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01068","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01068","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01068","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"You, Zebin","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"You, Zebin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127881576","display_name":"Xiaolu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiaolu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128012132","display_name":"Jun Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127940865","display_name":"Chongxuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chongxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128009999","display_name":"Ji-Rong Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Ji-Rong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.483599990606308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.483599990606308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.37450000643730164,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.01590000092983246,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.7610999941825867},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6478000283241272},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5299999713897705},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5256999731063843},{"id":"https://openalex.org/keywords/coupling","display_name":"Coupling (piping)","score":0.5205000042915344},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4733999967575073}],"concepts":[{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.7610999941825867},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6557999849319458},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6478000283241272},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5299999713897705},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5256999731063843},{"id":"https://openalex.org/C131584629","wikidata":"https://www.wikidata.org/wiki/Q4308705","display_name":"Coupling (piping)","level":2,"score":0.5205000042915344},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4733999967575073},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.41940000653266907},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.38449999690055847},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.37709999084472656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37549999356269836},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.3215000033378601},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3010999858379364},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.2937000095844269},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.2791000008583069},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.2567000091075897},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.2526000142097473}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01068","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01068","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01068","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01068","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"present":[1],"\\textbf{LLaDA-o},":[2],"an":[3],"effective":[4],"and":[5,13,33,46,92,95],"length-adaptive":[6],"omni":[7,108],"diffusion":[8,29,35,109],"model":[9],"for":[10,30,36,54,100],"multimodal":[11,73,90],"understanding":[12,32,91],"generation.":[14],"LLaDA-o":[15,82],"is":[16,112],"built":[17],"on":[18,58,89,98],"a":[19,43,63],"Mixture":[20],"of":[21,106],"Diffusion":[22],"(MoD)":[23],"framework":[24],"that":[25,50,68,81],"decouples":[26],"discrete":[27],"masked":[28],"text":[31],"continuous":[34],"visual":[37],"generation,":[38,102],"while":[39],"coupling":[40],"them":[41],"through":[42],"shared,":[44],"simple,":[45],"efficient":[47],"attention":[48],"backbone":[49],"reduces":[51],"redundant":[52],"computation":[53],"fixed":[55],"conditions.":[56],"Building":[57],"MoD,":[59],"we":[60],"further":[61],"introduce":[62],"data-centric":[64],"length":[65],"adaptation":[66],"strategy":[67],"enables":[69],"flexible-length":[70],"decoding":[71],"in":[72],"settings":[74],"without":[75],"architectural":[76],"changes.":[77],"Extensive":[78],"experiments":[79],"show":[80],"achieves":[83],"state-of-the-art":[84],"performance":[85],"among":[86],"omni-diffusion":[87],"models":[88],"generation":[93],"benchmarks,":[94],"reaches":[96],"87.04":[97],"DPG-Bench":[99],"text-to-image":[101],"supporting":[103],"the":[104],"effectiveness":[105],"unified":[107],"modeling.":[110],"Code":[111],"available":[113],"at":[114],"https://github.com/ML-GSAI/LLaDA-o.":[115]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-03-04T00:00:00"}
