{"id":"https://openalex.org/W7161298728","doi":"https://doi.org/10.48550/arxiv.2605.14874","title":"LPH-VTON: Resolving the Structure-Texture Dilemma of Virtual Try-On via Latent Process Handover","display_name":"LPH-VTON: Resolving the Structure-Texture Dilemma of Virtual Try-On via Latent Process Handover","publication_year":2026,"publication_date":"2026-05-14","ids":{"openalex":"https://openalex.org/W7161298728","doi":"https://doi.org/10.48550/arxiv.2605.14874"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.14874","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14874","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.14874","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136216377","display_name":"Yixin Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yixin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102690053","display_name":"Baihong Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, 
Baihong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136232706","display_name":"Jinglin Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jinglin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136198024","display_name":"Jeffery Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Jeffery","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136227075","display_name":"Yan Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136207333","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0001-5788-6314"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136202355","display_name":"Yida Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yida","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084287163","display_name":"Lanqing Yang","orcid":"https://orcid.org/0000-0002-1551-224X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Lanqing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101490654","display_name":"Guangtao 
Xue","orcid":"https://orcid.org/0000-0002-1617-3593"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Guangtao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6902999877929688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6902999877929688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.18060000240802765,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization 
Techniques","score":0.07090000063180923,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.6198999881744385},{"id":"https://openalex.org/keywords/morphing","display_name":"Morphing","score":0.506600022315979},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.48510000109672546},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4740000069141388},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.367000013589859},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.34139999747276306},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.3264000117778778},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.3240000009536743}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7688999772071838},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.6198999881744385},{"id":"https://openalex.org/C50637493","wikidata":"https://www.wikidata.org/wiki/Q1136781","display_name":"Morphing","level":2,"score":0.506600022315979},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior 
probability","level":3,"score":0.48510000109672546},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4740000069141388},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.446399986743927},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.367000013589859},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.34139999747276306},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3240000009536743},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3206000030040741},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.32030001282691956},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.302700012922287},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.29409998655319214},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame 
(networking)","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C76956256","wikidata":"https://www.wikidata.org/wiki/Q27610560","display_name":"Process modeling","level":3,"score":0.2797999978065491},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.27399998903274536},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26840001344680786},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.25609999895095825},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.25380000472068787},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.2533000111579895}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.14874","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14874","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell 
University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.14874","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14874","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Virtual":[0],"Try-On":[1],"(VTON)":[2],"aims":[3],"to":[4,79,112,127],"synthesize":[5],"photorealistic":[6],"images":[7],"of":[8,42,167],"garments":[9],"precisely":[10],"aligned":[11],"with":[12],"a":[13,23,40,89,98,109,114,128,143],"person's":[14],"body":[15],"and":[16,29],"pose.":[17],"Current":[18],"diffusion-based":[19],"methods,":[20],"however,":[21],"face":[22],"fundamental":[24],"trade-off":[25],"between":[26],"structural":[27,80,157],"integrity":[28],"textural":[30],"fidelity.":[31],"In":[32],"this":[33,37,84,95],"paper,":[34],"we":[35,86],"formalize":[36],"challenge":[38],"as":[39],"consequence":[41],"complementary":[43],"inductive":[44],"biases":[45],"inherent":[46],"in":[47,119,150],"prevailing":[48],"architectures:":[49],"models":[50,65],"heav
ily":[51],"reliant":[52],"on":[53,83],"spatial":[54],"constraints":[55],"naturally":[56],"favor":[57],"geometric":[58],"alignment":[59,158],"but":[60,76],"often":[61],"suppress":[62],"textures,":[63],"whereas":[64],"dominated":[66],"by":[67],"unconstrained":[68],"generative":[69],"priors":[70],"excel":[71],"at":[72],"vibrant":[73],"detail":[74,133],"rendering":[75],"are":[77],"prone":[78],"drift.":[81],"Based":[82],"diagnosis,":[85],"propose":[87],"LPH-VTON,":[88],"new":[90,148],"synergistic":[91],"framework":[92],"that":[93],"resolves":[94],"tension":[96],"within":[97],"single,":[99],"continuous":[100],"denoising":[101],"process.":[102],"LPH-VTON":[103],"strategically":[104],"decomposes":[105],"the":[106,120,160,165],"generation,":[107],"leveraging":[108],"structure-biased":[110],"model":[111,130,141],"establish":[113],"geometrically":[115],"consistent":[116],"latent":[117],"scaffold":[118],"early":[121],"stages,":[122],"before":[123],"handing":[124],"over":[125],"control":[126],"texture-biased":[129],"for":[131],"high-fidelity":[132],"rendering.":[134],"Extensive":[135],"experiments":[136],"validate":[137],"our":[138],"approach.":[139],"Our":[140],"achieves":[142],"superior":[144],"Pareto-optimal":[145],"balance,":[146],"establishing":[147],"benchmarks":[149],"perceptual":[151],"faithfulness":[152],"while":[153],"maintaining":[154],"highly":[155],"competitive":[156],"across":[159],"standard":[161],"dataset":[162],"VITON-HD,":[163],"proving":[164],"efficacy":[166],"temporal":[168],"architectural":[169],"decoupling.":[170]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-16T00:00:00"}
