{"id":"https://openalex.org/W7130708562","doi":"https://doi.org/10.48550/arxiv.2602.17636","title":"CORAL: Correspondence Alignment for Improved Virtual Try-On","display_name":"CORAL: Correspondence Alignment for Improved Virtual Try-On","publication_year":2026,"publication_date":"2026-02-19","ids":{"openalex":"https://openalex.org/W7130708562","doi":"https://doi.org/10.48550/arxiv.2602.17636"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.17636","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126511004","display_name":"Jiyoung Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kim, Jiyoung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126462267","display_name":"Youngjin Shin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shin, Youngjin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102637406","display_name":"Siyoon Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Siyoon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121257318","display_name":"Dahyun Chung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chung, Dahyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126505295","display_name":"Jisu Nam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nam, Jisu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126498317","display_name":"Tongmin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Tongmin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126481096","display_name":"Jongjae Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Jongjae","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109512628","display_name":"Hyeon-Woo Kang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kang, Hyeonwoo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126449464","display_name":"Seungryong Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Seungryong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5126511004"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.7961999773979187,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.7961999773979187,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0763000026345253,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.05180000141263008,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correspondence-problem","display_name":"Correspondence problem","score":0.6711999773979187},{"id":"https://openalex.org/keywords/minification","display_name":"Minification","score":0.5393000245094299},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4537999927997589},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.45249998569488525},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3659999966621399},{"id":"https://openalex.org/keywords/feature-matching","display_name":"Feature matching","score":0.3456000089645386},{"id":"https://openalex.org/keywords/image-matching","display_name":"Image matching","score":0.32199999690055847},{"id":"https://openalex.org/keywords/correspondence-analysis","display_name":"Correspondence analysis","score":0.3192000091075897}],"concepts":[{"id":"https://openalex.org/C3004257","wikidata":"https://www.wikidata.org/wiki/Q17084606","display_name":"Correspondence problem","level":2,"score":0.6711999773979187},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6376000046730042},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5956000089645386},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.5393000245094299},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4537999927997589},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.45249998569488525},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4510999917984009},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3659999966621399},{"id":"https://openalex.org/C2983787585","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature matching","level":3,"score":0.3456000089645386},{"id":"https://openalex.org/C2986492983","wikidata":"https://www.wikidata.org/wiki/Q861092","display_name":"Image matching","level":3,"score":0.32199999690055847},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3215000033378601},{"id":"https://openalex.org/C148298330","wikidata":"https://www.wikidata.org/wiki/Q1784754","display_name":"Correspondence analysis","level":2,"score":0.3192000091075897},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3167000114917755},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C167981619","wikidata":"https://www.wikidata.org/wiki/Q1685498","display_name":"Cross entropy","level":3,"score":0.3034000098705292},{"id":"https://openalex.org/C171752962","wikidata":"https://www.wikidata.org/wiki/Q255166","display_name":"Kullback\u2013Leibler divergence","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C160697094","wikidata":"https://www.wikidata.org/wiki/Q1233197","display_name":"Oblique case","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.27059999108314514},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.25769999623298645}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.17636","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.17636","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.17636","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.17636","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Existing":[0],"methods":[1,24],"for":[2],"Virtual":[3],"Try-On":[4],"(VTON)":[5],"often":[6],"struggle":[7],"to":[8,33,127],"preserve":[9],"fine":[10],"garment":[11],"details,":[12],"especially":[13],"in":[14,51],"unpaired":[15],"settings":[16],"where":[17],"accurate":[18],"person-garment":[19,29,58,64,108],"correspondence":[20,36,59,100],"is":[21],"required.":[22],"These":[23],"do":[25],"not":[26],"explicitly":[27,86],"enforce":[28],"alignment":[30],"and":[31,54,110,143],"fail":[32],"explain":[34],"how":[35],"emerges":[37],"within":[38,67],"Diffusion":[39],"Transformers":[40],"(DiTs).":[41],"In":[42],"this":[43,74],"paper,":[44],"we":[45,76],"first":[46],"analyze":[47],"full":[48,69],"3D":[49,70],"attention":[50,118],"DiT-based":[52,83],"architecture":[53],"reveal":[55],"that":[56,85,103,115],"the":[57,68,117,136],"critically":[60],"depends":[61],"on":[62,73],"precise":[63],"query-key":[65,88],"matching":[66,89],"attention.":[71],"Building":[72],"insight,":[75],"then":[77],"introduce":[78],"CORrespondence":[79],"ALignment":[80],"(CORAL),":[81],"a":[82,99,123],"framework":[84],"aligns":[87,104],"with":[90,107],"robust":[91],"external":[92],"correspondences.":[93],"CORAL":[94,132],"integrates":[95],"two":[96],"complementary":[97],"components:":[98],"distillation":[101],"loss":[102,114],"reliable":[105],"matches":[106],"attention,":[109],"an":[111],"entropy":[112],"minimization":[113],"sharpens":[116],"distribution.":[119],"We":[120],"further":[121],"propose":[122],"VLM-based":[124],"evaluation":[125],"protocol":[126],"better":[128],"reflect":[129],"human":[130],"preference.":[131],"consistently":[133],"improves":[134],"over":[135],"baseline,":[137],"enhancing":[138],"both":[139],"global":[140],"shape":[141],"transfer":[142],"local":[144],"detail":[145],"preservation.":[146],"Extensive":[147],"ablations":[148],"validate":[149],"our":[150],"design":[151],"choices.":[152]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-21T00:00:00"}
