{"id":"https://openalex.org/W4417009993","doi":"https://doi.org/10.48550/arxiv.2512.02781","title":"LumiX: Structured and Coherent Text-to-Intrinsic Generation","display_name":"LumiX: Structured and Coherent Text-to-Intrinsic Generation","publication_year":2025,"publication_date":"2025-12-02","ids":{"openalex":"https://openalex.org/W4417009993","doi":"https://doi.org/10.48550/arxiv.2512.02781"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2512.02781","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.02781","pdf_url":"https://arxiv.org/pdf/2512.02781","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.02781","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100668503","display_name":"Xu Han","orcid":"https://orcid.org/0000-0002-4726-7621"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Han, Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100363708","display_name":"Biao Zhang","orcid":"https://orcid.org/0000-0001-6305-838X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Biao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087452083","display_name":"Xiangjun Tang","orcid":"https://orcid.org/0000-0001-7441-0086"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Xiangjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101763340","display_name":"Xianzhi Li","orcid":"https://orcid.org/0000-0002-0231-720X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xianzhi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5076768552","display_name":"Peter Wonka","orcid":"https://orcid.org/0000-0003-0627-9746"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wonka, Peter","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100668503"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6740000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6740000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1363999992609024,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.024399999529123306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2512.02781","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.02781","pdf_url":"https://arxiv.org/pdf/2512.02781","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2512.02781","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.02781","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.02781","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.02781","pdf_url":"https://arxiv.org/pdf/2512.02781","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"present":[1],"LumiX,":[2],"a":[3,18,33,53,72,114],"structured":[4,34],"diffusion":[5,90],"framework":[6],"for":[7,80],"coherent":[8,104],"text-to-intrinsic":[9],"generation.":[10],"Conditioned":[11],"on":[12],"text":[13],"prompts,":[14],"LumiX":[15,102],"jointly":[16],"generates":[17],"comprehensive":[19],"set":[20],"of":[21,39,95,125],"intrinsic":[22,97,134],"maps":[23,64],"(e.g.,":[24],"albedo,":[25],"irradiance,":[26],"normal,":[27],"depth,":[28],"and":[29,35,92,105,113,128],"final":[30],"color),":[31],"providing":[32],"physically":[36,106],"consistent":[37],"description":[38],"an":[40],"underlying":[41],"scene.":[42],"This":[43],"is":[44],"enabled":[45],"by":[46,59],"two":[47],"key":[48],"contributions:":[49],"1)":[50],"Query-Broadcast":[51],"Attention,":[52],"mechanism":[54],"that":[55,75,101],"ensures":[56],"structural":[57],"consistency":[58],"sharing":[60],"queries":[61],"across":[62],"all":[63],"in":[65],"each":[66],"self-attention":[67],"block.":[68],"2)":[69],"Tensor":[70],"LoRA,":[71],"tensor-based":[73],"adaptation":[74],"parameter-efficiently":[76],"models":[77],"cross-map":[78],"relations":[79],"efficient":[81],"joint":[82,89],"training.":[83],"Together,":[84],"these":[85],"designs":[86],"enable":[87],"stable":[88],"training":[91],"unified":[93],"generation":[94],"multiple":[96],"properties.":[98],"Experiments":[99],"show":[100],"produces":[103],"meaningful":[107],"results,":[108],"achieving":[109],"23%":[110],"higher":[111],"alignment":[112],"better":[115],"preference":[116],"score":[117],"(0.19":[118],"vs.":[119],"-0.41)":[120],"compared":[121],"to":[122],"the":[123,126,137],"state":[124],"art,":[127],"it":[129],"can":[130],"also":[131],"perform":[132],"image-conditioned":[133],"decomposition":[135],"within":[136],"same":[138],"framework.":[139]},"counts_by_year":[],"updated_date":"2026-03-03T08:47:05.690250","created_date":"2025-12-04T00:00:00"}
