{"id":"https://openalex.org/W4416060594","doi":"https://doi.org/10.1109/iccv51701.2025.01566","title":"Rethinking Layered Graphic Design Generation with a Top-Down Approach","display_name":"Rethinking Layered Graphic Design Generation with a Top-Down Approach","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416060594","doi":"https://doi.org/10.1109/iccv51701.2025.01566"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.01566","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.01566","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.05601","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035486052","display_name":"J.C. Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jingye Chen","raw_affiliation_strings":["HKUST"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"HKUST","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068625652","display_name":"Zhaowen Wang","orcid":"https://orcid.org/0000-0002-4605-2506"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhaowen Wang","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nanxuan Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nanxuan Zhao","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100425475","display_name":"Li Zhang","orcid":"https://orcid.org/0000-0001-9330-6727"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Li Zhang","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041433128","display_name":"Difan Liu","orcid":"https://orcid.org/0000-0001-5971-2748"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Difan Liu","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jimei Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jimei Yang","raw_affiliation_strings":["Runway"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Runway","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100719528","display_name":"Qifeng Chen","orcid":"https://orcid.org/0000-0003-0515-3826"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Qifeng Chen","raw_affiliation_strings":["HKUST"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"HKUST","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28603477,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"16861","last_page":"16870"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.3093999922275543,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.3093999922275543,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.14810000360012054,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.08540000021457672,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.7677000164985657},{"id":"https://openalex.org/keywords/graphic-design","display_name":"Graphic design","score":0.5163999795913696},{"id":"https://openalex.org/keywords/page-layout","display_name":"Page layout","score":0.47380000352859497},{"id":"https://openalex.org/keywords/inpainting","display_name":"Inpainting","score":0.4287000000476837},{"id":"https://openalex.org/keywords/environmental-graphic-design","display_name":"Environmental graphic design","score":0.37059998512268066},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.3637000024318695},{"id":"https://openalex.org/keywords/design-elements-and-principles","display_name":"Design elements and principles","score":0.3544999957084656},{"id":"https://openalex.org/keywords/design-knowledge","display_name":"Design knowledge","score":0.33469998836517334}],"concepts":[{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.7677000164985657},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7185999751091003},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5608999729156494},{"id":"https://openalex.org/C15724806","wikidata":"https://www.wikidata.org/wiki/Q185925","display_name":"Graphic design","level":2,"score":0.5163999795913696},{"id":"https://openalex.org/C188985296","wikidata":"https://www.wikidata.org/wiki/Q868954","display_name":"Page layout","level":2,"score":0.47380000352859497},{"id":"https://openalex.org/C199639397","wikidata":"https://www.wikidata.org/wiki/Q1788588","display_name":"Engineering drawing","level":1,"score":0.45179998874664307},{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.4287000000476837},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3837999999523163},{"id":"https://openalex.org/C104247647","wikidata":"https://www.wikidata.org/wiki/Q185925","display_name":"Environmental graphic design","level":3,"score":0.37059998512268066},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.3637000024318695},{"id":"https://openalex.org/C33276779","wikidata":"https://www.wikidata.org/wiki/Q1943363","display_name":"Design elements and principles","level":2,"score":0.3544999957084656},{"id":"https://openalex.org/C2778712445","wikidata":"https://www.wikidata.org/wiki/Q5264352","display_name":"Design knowledge","level":3,"score":0.33469998836517334},{"id":"https://openalex.org/C153715457","wikidata":"https://www.wikidata.org/wiki/Q254183","display_name":"Augmented reality","level":2,"score":0.33399999141693115},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3228999972343445},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30329999327659607},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C2777466363","wikidata":"https://www.wikidata.org/wiki/Q17008971","display_name":"Design tool","level":2,"score":0.28600001335144043},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C138852830","wikidata":"https://www.wikidata.org/wiki/Q2292993","display_name":"Design methods","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.25600001215934753},{"id":"https://openalex.org/C201025465","wikidata":"https://www.wikidata.org/wiki/Q11248500","display_name":"User experience design","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iccv51701.2025.01566","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.01566","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2507.05601","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.05601","pdf_url":"https://arxiv.org/pdf/2507.05601","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-167942","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-167942","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"},{"id":"doi:10.48550/arxiv.2507.05601","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.05601","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.05601","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.05601","pdf_url":"https://arxiv.org/pdf/2507.05601","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Graphic":[0],"design":[1,88,135,211,217,264],"is":[2,116],"crucial":[3],"for":[4],"conveying":[5],"ideas":[6],"and":[7,17,69,152,192,232,256,259],"messages.":[8],"Designers":[9],"usually":[10],"organize":[11],"their":[12,65],"work":[13],"into":[14,99],"objects,":[15],"backgrounds,":[16],"vectorized":[18],"text":[19,70,107,253,257],"layers":[20],"to":[21,95,137,158,179,196,254],"simplify":[22],"editing.":[23],"However,":[24],"this":[25,81],"workflow":[26],"demands":[27],"considerable":[28],"expertise.":[29],"With":[30],"the":[31,74,92,139,171,198,208,244],"rise":[32],"of":[33,39,76,200],"GenAI":[34],"methods,":[35],"an":[36],"endless":[37],"supply":[38],"high-quality":[40],"graphic":[41,87,201,210],"designs":[42,52,59,98],"in":[43,67,127,141,165,262],"pixel":[44],"format":[45],"has":[46],"become":[47],"more":[48],"accessible,":[49],"though":[50],"these":[51],"often":[53],"lack":[54],"editability.":[55],"Despite":[56],"this,":[57],"non-layered":[58],"still":[60],"inspire":[61],"human":[62],"designers,":[63],"influencing":[64],"choices":[66],"layouts":[68],"styles,":[71],"ultimately":[72],"guiding":[73],"creation":[75,199],"layered":[77,101,160],"designs.":[78],"Motivated":[79],"by":[80,112,169,225,235],"observation,":[82],"we":[83,134],"propose":[84],"Accordion,":[85],"a":[86,119,166,226],"generation":[89],"framework":[90],"taking":[91],"first":[93],"attempt":[94],"convert":[96],"AI-generated":[97,106,216],"editable":[100],"designs,":[102,161],"meanwhile":[103],"refining":[104],"nonsensical":[105],"with":[108,215,220],"meaningful":[109],"alternatives":[110],"guided":[111],"user":[113,233],"prompts.":[114],"It":[115],"built":[117],"around":[118],"vision":[120,187],"language":[121],"model":[122],"(VLM)":[123],"playing":[124],"distinct":[125],"roles":[126],"three":[128],"curated":[129],"stages.":[130],"For":[131],"each":[132,181],"stage,":[133],"prompts":[136],"guide":[138],"VLM":[140],"executing":[142],"different":[143],"tasks.":[144],"Distinct":[145],"from":[146],"existing":[147],"bottom-up":[148],"methods":[149],"(e.g.,":[150],"COLE":[151],"Open-COLE)":[153],"that":[154,238],"gradually":[155],"generate":[156],"elements":[157],"create":[159],"our":[162,205],"approach":[163],"works":[164],"top-down":[167],"manner":[168],"using":[170,207],"visually":[172],"harmonious":[173],"reference":[174],"image":[175],"as":[176,190,250],"global":[177],"guidance":[178],"decompose":[180],"layer.":[182],"Additionally,":[183],"it":[184],"leverages":[185],"multiple":[186],"experts":[188],"such":[189,249],"SAM":[191],"element":[193],"removal":[194],"models":[195],"facilitate":[197],"layers.":[202],"We":[203],"train":[204],"method":[206],"in-house":[209],"dataset":[212],"Design39K,":[213],"augmented":[214],"images":[218],"coupled":[219],"refined":[221],"ground":[222],"truth":[223],"created":[224],"customized":[227],"inpainting":[228],"model.":[229],"Experimental":[230],"results":[231,242],"studies":[234],"designers":[236],"show":[237],"Accordion":[239],"generates":[240],"favorable":[241],"on":[243],"DesignIntention":[245],"benchmark,":[246],"including":[247],"tasks":[248],"text-to-template,":[251],"adding":[252],"background,":[255],"de-rendering,":[258],"also":[260],"excels":[261],"creating":[263],"variations.":[265]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
