{"id":"https://openalex.org/W4402981855","doi":"https://doi.org/10.1109/icme57554.2024.10688255","title":"DNAF: Diffusion with Noise-Aware Feature for Pose-Guided Person Image Synthesis","display_name":"DNAF: Diffusion with Noise-Aware Feature for Pose-Guided Person Image Synthesis","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4402981855","doi":"https://doi.org/10.1109/icme57554.2024.10688255"},"language":"en","primary_location":{"id":"doi:10.1109/icme57554.2024.10688255","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icme57554.2024.10688255","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100900799","display_name":"Guo Li-yan","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liyan Guo","raw_affiliation_strings":["Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049156119","display_name":"Kaiyu Song","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiyu Song","raw_affiliation_strings":["Sun Yat-sen University,School of Artificial Intelligence,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Artificial Intelligence,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102008835","display_name":"Mengying Xu","orcid":"https://orcid.org/0000-0003-1862-6709"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengying Xu","raw_affiliation_strings":["Sun Yat-sen University,School of Systems Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Systems Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076868018","display_name":"Hanjiang Lai","orcid":"https://orcid.org/0000-0001-8057-6744"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanjiang Lai","raw_affiliation_strings":["Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100900799"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":0.2632,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54393264,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6936743855476379},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6862096786499023},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.6121683716773987},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6041477918624878},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5797824263572693},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.515805721282959},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5122761130332947},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.060655415058135986}],"concepts":[{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6936743855476379},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6862096786499023},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.6121683716773987},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6041477918624878},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5797824263572693},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.515805721282959},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5122761130332947},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.060655415058135986},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme57554.2024.10688255","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icme57554.2024.10688255","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"id":"https://metadata.un.org/sdg/5","display_name":"Gender equality"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2204750386","https://openalex.org/W2471768434","https://openalex.org/W2559085405","https://openalex.org/W2962785568","https://openalex.org/W2963266880","https://openalex.org/W2964002510","https://openalex.org/W3034950620","https://openalex.org/W3035515747","https://openalex.org/W3138516171","https://openalex.org/W3176412779","https://openalex.org/W3180675665","https://openalex.org/W4312881655","https://openalex.org/W4312896571","https://openalex.org/W4312933868","https://openalex.org/W4313030876","https://openalex.org/W4386072096","https://openalex.org/W4386076520","https://openalex.org/W4390873030","https://openalex.org/W4390873194","https://openalex.org/W4393148714","https://openalex.org/W4402727926"],"related_works":["https://openalex.org/W3147584709","https://openalex.org/W2977677679","https://openalex.org/W1992327129","https://openalex.org/W2381986121","https://openalex.org/W2370918718","https://openalex.org/W2256933480","https://openalex.org/W2755342338","https://openalex.org/W2027854990","https://openalex.org/W2775347418","https://openalex.org/W2370081953"],"abstract_inverted_index":{"Pose-guided":[0],"person":[1],"image":[2],"synthesis":[3],"aims":[4],"at":[5],"generating":[6],"images":[7],"based":[8],"on":[9,136],"the":[10,15,26,39,57,65,69,84,90,93,97,109,115,125],"related":[11],"pose":[12,42,50,86],"skeleton":[13],"and":[14,44,138],"appearance":[16],"of":[17,64],"a":[18,22,103],"source":[19],"image.":[20],"As":[21],"popular":[23],"generative":[24],"model,":[25],"diffusion":[27,66,126],"model":[28,67],"shows":[29],"its":[30],"potential.":[31],"However,":[32],"there":[33],"are":[34],"two":[35],"gaps":[36],"to":[37,56,88,96,107,121],"hinder":[38],"fusion":[40],"between":[41],"information":[43,51],"appearance:":[45],"1)":[46],"Directly":[47],"injecting":[48],"pixel-level":[49],"into":[52],"semantic":[53],"features":[54,120],"leads":[55],"representation":[58],"gap.":[59,71],"2)":[60],"The":[61],"timestep-dependent":[62],"nature":[63],"introduces":[68],"noise-induced":[70],"To":[72],"alleviate":[73],"these,":[74],"we":[75,82,101,117],"propose":[76,102],"Diffusion":[77],"with":[78],"Noise-Aware":[79],"Feature(DNAF).":[80],"Concretely,":[81],"leverage":[83],"T2I-Adapter-based":[85],"adapter":[87],"achieve":[89],"mapping":[91],"from":[92],"pixel":[94],"level":[95],"feature":[98,112],"level.":[99],"Then,":[100],"lightweight":[104],"trainable":[105],"layer":[106],"infuse":[108],"multi-scale":[110],"constant":[111],"adaptively.":[113],"In":[114],"end,":[116],"construct":[118],"noise-aware":[119],"more":[122],"effectively":[123],"guide":[124],"process.":[127],"Experimental":[128],"results":[129,135],"show":[130],"that":[131],"DNAF":[132],"achieves":[133],"competitive":[134],"DeepFashion":[137],"Market-1501":[139],"datasets.":[140]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
