{"id":"https://openalex.org/W4403780713","doi":"https://doi.org/10.1145/3664647.3680693","title":"HandRefiner: Refining Malformed Hands in Generated Images by Diffusion-based Conditional Inpainting","display_name":"HandRefiner: Refining Malformed Hands in Generated Images by Diffusion-based Conditional Inpainting","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403780713","doi":"https://doi.org/10.1145/3664647.3680693"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680693","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680693","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103713743","display_name":"Wenquan Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Wenquan Lu","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"raw_orcid":"https://orcid.org/0009-0004-6503-5447","affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042154277","display_name":"Yufei Xu","orcid":"https://orcid.org/0000-0002-9931-5138"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Yufei Xu","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"raw_orcid":"https://orcid.org/0000-0002-9931-5138","affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100345321","display_name":"Jing Zhang","orcid":"https://orcid.org/0000-0001-6595-7661"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jing Zhang","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"raw_orcid":"https://orcid.org/0000-0001-6595-7661","affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101701657","display_name":"Chaoyue Wang","orcid":"https://orcid.org/0000-0002-9002-1029"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Chaoyue Wang","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"raw_orcid":"https://orcid.org/0000-0002-9002-1029","affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074103823","display_name":"Dacheng Tao","orcid":"https://orcid.org/0000-0001-7225-5449"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dacheng Tao","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-7225-5449","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103713743"],"corresponding_institution_ids":["https://openalex.org/I129604602"],"apc_list":null,"apc_paid":null,"fwci":3.4529,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.93935328,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"7085","last_page":"7093"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inpainting","display_name":"Inpainting","score":0.9211761951446533},{"id":"https://openalex.org/keywords/refining","display_name":"Refining (metallurgy)","score":0.7681886553764343},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.622501015663147},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6219666004180908},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5347280502319336},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.44332197308540344},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.39283353090286255},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3795055150985718},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2709837257862091},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.09768170118331909}],"concepts":[{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.9211761951446533},{"id":"https://openalex.org/C60044698","wikidata":"https://www.wikidata.org/wiki/Q1283324","display_name":"Refining (metallurgy)","level":2,"score":0.7681886553764343},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.622501015663147},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6219666004180908},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5347280502319336},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.44332197308540344},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.39283353090286255},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3795055150985718},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2709837257862091},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.09768170118331909},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C191897082","wikidata":"https://www.wikidata.org/wiki/Q11467","display_name":"Metallurgy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680693","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680693","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2101032778","https://openalex.org/W2559085405","https://openalex.org/W2768683308","https://openalex.org/W2955639361","https://openalex.org/W2962845008","https://openalex.org/W2973857456","https://openalex.org/W3081167590","https://openalex.org/W3174458495","https://openalex.org/W3204715535","https://openalex.org/W4212774754","https://openalex.org/W4243294870","https://openalex.org/W4312497550","https://openalex.org/W4312933868","https://openalex.org/W4383472654","https://openalex.org/W4386072118","https://openalex.org/W4390872297","https://openalex.org/W4390873054","https://openalex.org/W4393148622","https://openalex.org/W4393148714","https://openalex.org/W4402660144"],"related_works":["https://openalex.org/W2380775572","https://openalex.org/W2213520135","https://openalex.org/W2244018504","https://openalex.org/W4242046654","https://openalex.org/W3174923100","https://openalex.org/W3134074939","https://openalex.org/W2117562399","https://openalex.org/W4298074124","https://openalex.org/W2587407424","https://openalex.org/W1523707610"],"abstract_inverted_index":{"Diffusion":[0],"models":[1],"have":[2],"achieved":[3],"remarkable":[4],"success":[5],"in":[6,110],"generating":[7,13],"realistic":[8,167],"images":[9],"but":[10],"suffer":[11],"from":[12,28,41,162],"accurate":[14],"human":[15],"hands,":[16,122],"such":[17,129],"as":[18,142],"incorrect":[19],"finger":[20],"counts":[21],"or":[22],"irregular":[23],"shapes.":[24],"This":[25],"difficulty":[26],"arises":[27],"the":[29,34,78,83,92,106,111,145,163,178],"complex":[30],"task":[31],"of":[32,39,77,95,104,154],"learning":[33],"physical":[35],"structure":[36],"and":[37,48,97,168,182],"pose":[38,109],"hands":[40,72],"training":[42],"images,":[43],"which":[44],"involves":[45],"extensive":[46],"deformations":[47],"occlusions.":[49],"For":[50],"correct":[51,93,130],"hand":[52,84,98,108,131],"generation,":[53],"our":[54],"paper":[55],"introduces":[56],"a":[57,65,115,136],"lightweight":[58],"post-processing":[59],"solution":[60],"called":[61],"HandRefiner.":[62],"HandRefiner":[63,174],"employs":[64],"conditional":[66],"inpainting":[67],"approach":[68],"to":[69,91,120,127,151],"rectify":[70],"malformed":[71,121],"while":[73,100],"leaving":[74],"other":[75],"parts":[76],"image":[79,118],"untouched.":[80],"We":[81],"leverage":[82],"mesh":[85],"reconstruction":[86],"model":[87],"that":[88,173],"consistently":[89],"adheres":[90],"number":[94],"fingers":[96],"shape,":[99],"also":[101],"being":[102],"capable":[103],"fitting":[105],"desired":[107],"generated":[112,116],"image.":[113],"Given":[114],"failed":[117],"due":[119],"we":[123,134,143],"utilize":[124],"ControlNet":[125,141],"modules":[126],"re-inject":[128],"information.":[132],"Additionally,":[133],"uncover":[135],"phase":[137],"transition":[138],"phenomenon":[139],"within":[140],"vary":[144],"control":[146],"strength.":[147],"It":[148],"enables":[149],"us":[150],"take":[152],"advantage":[153],"more":[155],"readily":[156],"available":[157,187],"synthetic":[158,169],"data":[159],"without":[160],"suffering":[161],"domain":[164],"gap":[165],"between":[166],"hands.":[170],"Experiments":[171],"demonstrate":[172],"can":[175],"significantly":[176],"improve":[177],"generation":[179],"quality":[180],"quantitatively":[181],"qualitatively.":[183],"The":[184],"code":[185],"is":[186],"at":[188],"https://github.com/wenquanlu/HandRefiner.":[189]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":5}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
