{"id":"https://openalex.org/W4392427699","doi":"https://doi.org/10.1145/3664647.3680692","title":"When ControlNet Meets Inexplicit Masks: A Case Study of ControlNet on its Contour-following Ability","display_name":"When ControlNet Meets Inexplicit Masks: A Case Study of ControlNet on its Contour-following Ability","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4392427699","doi":"https://doi.org/10.1145/3664647.3680692"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680692","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680692","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2403.00467","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094063499","display_name":"Wenjie Xuan","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenjie Xuan","raw_affiliation_strings":["School of Computer Science, National Engineering Research Center for Multimedia Software, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, National Engineering Research Center for Multimedia Software, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101142434","display_name":"Yufei Xi Zhiyong Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Yufei Xu","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003926666","display_name":"Shanshan Zhao","orcid":"https://orcid.org/0000-0002-5828-4881"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Shanshan Zhao","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101701657","display_name":"Chaoyue Wang","orcid":"https://orcid.org/0000-0002-9002-1029"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Chaoyue Wang","raw_affiliation_strings":["The University of Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111140222","display_name":"Juhua Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Juhua Liu","raw_affiliation_strings":["School of Computer Science, National Engineering Research Center for Multimedia Software, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, National Engineering Research Center for Multimedia Software, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060042752","display_name":"Bo Du","orcid":"https://orcid.org/0000-0002-0059-8458"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Du","raw_affiliation_strings":["School of Computer Science, National Engineering Research Center for Multimedia Software, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, National Engineering Research Center for Multimedia Software, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110189407","display_name":"Dacheng Tao","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dacheng Tao","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5094063499"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":1.0535,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.78955937,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"6979","last_page":"6988"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.31679999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.31679999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5035058856010437},{"id":"https://openalex.org/keywords/engineering-drawing","display_name":"Engineering drawing","score":0.38579535484313965},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.32476240396499634},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2528120279312134}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5035058856010437},{"id":"https://openalex.org/C199639397","wikidata":"https://www.wikidata.org/wiki/Q1788588","display_name":"Engineering drawing","level":1,"score":0.38579535484313965},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.32476240396499634},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2528120279312134}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3664647.3680692","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680692","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2403.00467","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.00467","pdf_url":"https://arxiv.org/pdf/2403.00467","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2403.00467","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.00467","pdf_url":"https://arxiv.org/pdf/2403.00467","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W845365781","https://openalex.org/W1861492603","https://openalex.org/W2466618734","https://openalex.org/W2948672349","https://openalex.org/W2955639361","https://openalex.org/W2962770929","https://openalex.org/W2982450728","https://openalex.org/W4281485151","https://openalex.org/W4283791382","https://openalex.org/W4312911498","https://openalex.org/W4312933868","https://openalex.org/W4385327947","https://openalex.org/W4385537492","https://openalex.org/W4386075631","https://openalex.org/W4386076027","https://openalex.org/W4388191573","https://openalex.org/W4390873054","https://openalex.org/W4393148714","https://openalex.org/W4402753907"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W1979597421","https://openalex.org/W2007980826","https://openalex.org/W2061531152","https://openalex.org/W3002753104","https://openalex.org/W2077600819","https://openalex.org/W2142036596","https://openalex.org/W2072657027","https://openalex.org/W2600246793","https://openalex.org/W4238204885"],"abstract_inverted_index":{"ControlNet":[0,64,122],"excels":[1],"at":[2,157],"creating":[3],"content":[4],"that":[5],"closely":[6],"matches":[7],"precise":[8],"contours":[9],"in":[10,93,111,120],"user-provided":[11],"masks.":[12,87,114],"However,":[13],"when":[14],"these":[15,44],"masks":[16,46],"contain":[17],"noise,":[18],"as":[19],"a":[20,67,71,94],"frequent":[21],"occurrence":[22],"with":[23,47,58],"non-expert":[24],"users,":[25],"the":[26,36,41,81,85,100,108,112,133],"output":[27],"would":[28],"include":[29],"unwanted":[30],"artifacts.":[31],"This":[32],"paper":[33],"first":[34],"highlights":[35],"crucial":[37],"role":[38],"of":[39,43,66,84,140],"controlling":[40],"impact":[42],"inexplicit":[45,59,113],"diverse":[48,138],"deterioration":[49,68,78,82],"levels":[50],"through":[51],"in-depth":[52],"analysis.":[53],"Subsequently,":[54],"to":[55,97,123],"enhance":[56],"controllability":[57],"masks,":[60],"an":[61],"advanced":[62],"Shape-aware":[63],"consisting":[65],"estimator":[69,79],"and":[70,150],"shape-prior":[72],"modulation":[73,95],"block":[74,96],"is":[75,91],"devised.":[76],"The":[77],"assesses":[80],"factor":[83,90],"provided":[86],"Then":[88],"this":[89],"used":[92],"adaptively":[98],"adjust":[99],"model's":[101],"contour-following":[102],"ability,":[103],"which":[104],"helps":[105],"it":[106],"dismiss":[107],"noise":[109],"part":[110],"Extensive":[115],"experiments":[116],"prove":[117],"its":[118],"effectiveness":[119],"encouraging":[121],"interpret":[124],"inaccurate":[125],"spatial":[126],"conditions":[127],"robustly":[128],"rather":[129],"than":[130],"blindly":[131],"following":[132],"given":[134],"contours,":[135],"suitable":[136],"for":[137],"kinds":[139],"conditions.":[141],"We":[142],"showcase":[143],"application":[144],"scenarios":[145],"like":[146],"modifying":[147],"shape":[148],"priors":[149],"composable":[151],"shape-controllable":[152],"generation.":[153],"Codes":[154],"are":[155],"available":[156],"github.":[158]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-10T00:00:00"}
