{"id":"https://openalex.org/W4414360124","doi":"https://doi.org/10.24963/ijcai.2025/105","title":"Mask Does Not Matter: A Unified Latent Diffusion-Enhanced Framework for Mask-Free Virtual Try-On","display_name":"Mask Does Not Matter: A Unified Latent Diffusion-Enhanced Framework for Mask-Free Virtual Try-On","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4414360124","doi":"https://doi.org/10.24963/ijcai.2025/105"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2025/105","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/105","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054459288","display_name":"Chenghu Du","orcid":"https://orcid.org/0000-0001-7275-5064"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenghu Du","raw_affiliation_strings":["School of Computer Science and Artificial Intelligence, Wuhan University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103265176","display_name":"Junyin Wang","orcid":"https://orcid.org/0009-0008-5845-3615"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junyin Wang","raw_affiliation_strings":["School of Computer Science and Artificial Intelligence, Wuhan University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100399811","display_name":"Kai Liu","orcid":"https://orcid.org/0000-0001-7252-5939"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Liu","raw_affiliation_strings":["School of Computer Science and Artificial Intelligence, Wuhan University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011707621","display_name":"Shengwu Xiong","orcid":"https://orcid.org/0000-0002-4006-7029"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210100789","display_name":"Wuhan College","ror":"https://ror.org/01dashf18","country_code":"CN","type":"nonprofit","lineage":["https://openalex.org/I4210100789"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengwu Xiong","raw_affiliation_strings":["Interdisciplinary Artificial Intelligence Research Institute, Wuhan College","Shanghai Artificial Intelligence Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Interdisciplinary Artificial Intelligence Research Institute, Wuhan College","institution_ids":["https://openalex.org/I4210100789"]},{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101967703","display_name":"Yi Rong","orcid":"https://orcid.org/0000-0003-4867-6811"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Rong","raw_affiliation_strings":["Sanya Science and Education Innovation Park, Wuhan University of Technology","School of Computer Science and Artificial Intelligence, Wuhan University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sanya Science and Education Innovation Park, Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]},{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5054459288"],"corresponding_institution_ids":["https://openalex.org/I196699116"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21951147,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"936","last_page":"944"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9395999908447266,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9395999908447266,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9265000224113464,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.66839998960495},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6115999817848206},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5378999710083008},{"id":"https://openalex.org/keywords/randomness","display_name":"Randomness","score":0.48089998960494995},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4544000029563904},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4081999957561493},{"id":"https://openalex.org/keywords/inpainting","display_name":"Inpainting","score":0.39340001344680786},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.366100013256073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7330999970436096},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.66839998960495},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6115999817848206},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5824000239372253},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5378999710083008},{"id":"https://openalex.org/C125112378","wikidata":"https://www.wikidata.org/wiki/Q176640","display_name":"Randomness","level":2,"score":0.48089998960494995},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4578999876976013},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4544000029563904},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4081999957561493},{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.39340001344680786},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.366100013256073},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.35339999198913574},{"id":"https://openalex.org/C50494287","wikidata":"https://www.wikidata.org/wiki/Q658467","display_name":"Texture synthesis","level":5,"score":0.34450000524520874},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34119999408721924},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.3140999972820282},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.298799991607666},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2971000075340271},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.28060001134872437},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2720000147819519},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.2712000012397766},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2025/105","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/105","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"A":[0],"good":[1],"virtual":[2,83,196],"try-on":[3,197],"model":[4,69,139,161],"should":[5],"introduce":[6,151],"minimal":[7],"redundant":[8],"conditional":[9,63],"information":[10,111],"to":[11,24,47,65,93,116,123,136,140,157,162,175],"avoid":[12],"instability":[13,70],"and":[14,58,71,101,109,119],"increase":[15],"inference":[16,173],"efficiency.":[17,73],"Existing":[18],"methods":[19],"rely":[20],"on":[21,142,187],"inpainting":[22],"masks":[23],"guide":[25],"the":[26,29,32,76,113,125,138,160,177,181],"generation":[27,144],"of":[28,180],"object,":[30],"but":[31],"masks,":[33],"generated":[34,126],"by":[35],"unstable":[36],"human":[37],"parsers,":[38],"often":[39],"produce":[40],"unreliable":[41],"results":[42],"with":[43,145],"fabric":[44],"residues":[45],"due":[46],"wrong":[48],"segmentation.":[49],"Moreover,":[50],"large":[51],"mask":[52],"regions":[53],"can":[54],"lose":[55],"spatial":[56,107],"structure":[57,108],"identity":[59,110],"information,":[60],"requiring":[61],"extra":[62],"inputs":[64],"compensate,":[66],"which":[67],"increases":[68],"reduces":[72],"To":[74],"tackle":[75],"problem,":[77],"we":[78,88,129,168],"present":[79],"a":[80,90,131,152],"novel":[81],"Mask-Free":[82],"Try-ON":[84],"(MFTON)":[85],"framework.":[86],"Specifically,":[87],"propose":[89,130,169],"mask-free":[91],"strategy":[92],"eliminate":[94],"all":[95],"denoising":[96],"conditions":[97],"except":[98],"for":[99],"clothing":[100,127,132],"person":[102,114],"images,":[103],"thereby":[104],"directly":[105],"extracting":[106],"from":[112],"image":[115],"improve":[117],"efficiency":[118],"reduce":[120,176],"instability.":[121],"Additionally,":[122],"optimize":[124],"regions,":[128],"texture-aware":[133],"attention":[134],"mechanism":[135],"enable":[137,159],"focus":[141],"texture":[143],"significant":[146],"visual":[147],"differences.":[148],"We":[149],"then":[150],"geometric":[153],"detail":[154],"capture":[155,163],"loss":[156],"further":[158],"more":[164],"high-frequency":[165],"information.":[166],"Finally,":[167],"an":[170],"appearance":[171],"consistency":[172],"method":[174,193],"initial":[178],"randomness":[179],"sampling":[182],"process":[183],"significantly.":[184],"Extensive":[185],"experiments":[186],"popular":[188],"datasets":[189],"demonstrate":[190],"that":[191],"our":[192],"outperforms":[194],"state-of-the-art":[195],"methods.":[198]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
