{"id":"https://openalex.org/W3112593261","doi":"https://doi.org/10.1109/tpami.2022.3181587","title":"Semantic Layout Manipulation With High-Resolution Sparse Attention","display_name":"Semantic Layout Manipulation With High-Resolution Sparse Attention","publication_year":2022,"publication_date":"2022-06-13","ids":{"openalex":"https://openalex.org/W3112593261","doi":"https://doi.org/10.1109/tpami.2022.3181587","mag":"3112593261","pmid":"https://pubmed.ncbi.nlm.nih.gov/35696464"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2022.3181587","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3181587","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016267591","display_name":"Haitian Zheng","orcid":"https://orcid.org/0000-0003-0415-1765"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Haitian Zheng","raw_affiliation_strings":["Department of Computer Science, University of Rochester, Rochester, NY, USA"],"raw_orcid":"https://orcid.org/0000-0003-0415-1765","affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Rochester, Rochester, NY, USA","institution_ids":["https://openalex.org/I5388228"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101564904","display_name":"Zhe Lin","orcid":"https://orcid.org/0000-0003-1154-9907"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhe Lin","raw_affiliation_strings":["Adobe Research, San Jose, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-1154-9907","affiliations":[{"raw_affiliation_string":"Adobe Research, San Jose, CA, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085050428","display_name":"Jingwan Lu","orcid":"https://orcid.org/0000-0002-3598-9918"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jingwan Lu","raw_affiliation_strings":["Adobe Research, San Jose, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research, San Jose, CA, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055156362","display_name":"Scott Cohen","orcid":"https://orcid.org/0000-0002-3459-6899"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Scott Cohen","raw_affiliation_strings":["Adobe Research, San Jose, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research, San Jose, CA, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036510129","display_name":"Jianming Zhang","orcid":"https://orcid.org/0000-0002-9954-6294"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jianming Zhang","raw_affiliation_strings":["Adobe Research, San Jose, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-9954-6294","affiliations":[{"raw_affiliation_string":"Adobe Research, San Jose, CA, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101773973","display_name":"Ning Xu","orcid":"https://orcid.org/0000-0001-8910-0937"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ning Xu","raw_affiliation_strings":["Adobe Research, San Jose, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research, San Jose, CA, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055469774","display_name":"Jiebo Luo","orcid":"https://orcid.org/0000-0002-4516-9729"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiebo Luo","raw_affiliation_strings":["Department of Computer Science, University of Rochester, Rochester, NY, USA"],"raw_orcid":"https://orcid.org/0000-0002-4516-9729","affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Rochester, Rochester, NY, USA","institution_ids":["https://openalex.org/I5388228"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5016267591"],"corresponding_institution_ids":["https://openalex.org/I5388228"],"apc_list":null,"apc_paid":null,"fwci":0.8163,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.71723483,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":"45","issue":"3","first_page":"3768","last_page":"3782"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8640379905700684},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6653608679771423},{"id":"https://openalex.org/keywords/image-warping","display_name":"Image warping","score":0.576998233795166},{"id":"https://openalex.org/keywords/inpainting","display_name":"Inpainting","score":0.5571030378341675},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.544503390789032},{"id":"https://openalex.org/keywords/texture-synthesis","display_name":"Texture synthesis","score":0.5106938481330872},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4896707832813263},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.45674553513526917},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.45185959339141846},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4413035809993744},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.42846575379371643},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4262772798538208},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.24568864703178406},{"id":"https://openalex.org/keywords/image-texture","display_name":"Image texture","score":0.17540976405143738}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8640379905700684},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6653608679771423},{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.576998233795166},{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.5571030378341675},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.544503390789032},{"id":"https://openalex.org/C50494287","wikidata":"https://www.wikidata.org/wiki/Q658467","display_name":"Texture synthesis","level":5,"score":0.5106938481330872},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4896707832813263},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.45674553513526917},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.45185959339141846},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4413035809993744},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.42846575379371643},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4262772798538208},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.24568864703178406},{"id":"https://openalex.org/C63099799","wikidata":"https://www.wikidata.org/wiki/Q17147001","display_name":"Image texture","level":4,"score":0.17540976405143738},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2022.3181587","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3181587","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:35696464","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35696464","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W603908379","https://openalex.org/W1686810756","https://openalex.org/W1763426478","https://openalex.org/W1924619199","https://openalex.org/W1975049209","https://openalex.org/W1993120651","https://openalex.org/W1999360130","https://openalex.org/W2099471712","https://openalex.org/W2115273023","https://openalex.org/W2116013899","https://openalex.org/W2124386111","https://openalex.org/W2133564696","https://openalex.org/W2133665775","https://openalex.org/W2141155330","https://openalex.org/W2292976057","https://openalex.org/W2302243225","https://openalex.org/W2331128040","https://openalex.org/W2519536754","https://openalex.org/W2593414223","https://openalex.org/W2611605760","https://openalex.org/W2732026016","https://openalex.org/W2737258237","https://openalex.org/W2774267535","https://openalex.org/W2798600195","https://openalex.org/W2801693445","https://openalex.org/W2804078698","https://openalex.org/W2907097116","https://openalex.org/W2952716587","https://openalex.org/W2961363059","https://openalex.org/W2962770929","https://openalex.org/W2962785568","https://openalex.org/W2962793481","https://openalex.org/W2962974533","https://openalex.org/W2963073614","https://openalex.org/W2963522749","https://openalex.org/W2963800363","https://openalex.org/W2963840672","https://openalex.org/W2963890275","https://openalex.org/W2963920537","https://openalex.org/W2964121744","https://openalex.org/W2964125246","https://openalex.org/W2964148878","https://openalex.org/W2964309429","https://openalex.org/W2966926453","https://openalex.org/W2981682056","https://openalex.org/W2981689412","https://openalex.org/W2982763192","https://openalex.org/W2982809261","https://openalex.org/W3014641072","https://openalex.org/W3015643106","https://openalex.org/W3034438741","https://openalex.org/W3034515601","https://openalex.org/W3034667262","https://openalex.org/W3034723751","https://openalex.org/W3034950620","https://openalex.org/W3043547428","https://openalex.org/W3101838243","https://openalex.org/W3108501258","https://openalex.org/W3108554146","https://openalex.org/W3109174731","https://openalex.org/W3109276915","https://openalex.org/W3122887115","https://openalex.org/W3158252298","https://openalex.org/W3159890710","https://openalex.org/W3169001068","https://openalex.org/W3180675665","https://openalex.org/W4294643831","https://openalex.org/W6637373629","https://openalex.org/W6677548441","https://openalex.org/W6679434410","https://openalex.org/W6696085341","https://openalex.org/W6698256120","https://openalex.org/W6718379498","https://openalex.org/W6734074887","https://openalex.org/W6739901393","https://openalex.org/W6745560452","https://openalex.org/W6747225742","https://openalex.org/W6750942122","https://openalex.org/W6752378368","https://openalex.org/W6753955284","https://openalex.org/W6754416387","https://openalex.org/W6755312952","https://openalex.org/W6757857098","https://openalex.org/W6765779288","https://openalex.org/W6779669310"],"related_works":["https://openalex.org/W2385244905","https://openalex.org/W1554980273","https://openalex.org/W2021008485","https://openalex.org/W2352164403","https://openalex.org/W2317681159","https://openalex.org/W2368324430","https://openalex.org/W2771814581","https://openalex.org/W2616924144","https://openalex.org/W2085292936","https://openalex.org/W2355113740"],"abstract_inverted_index":{"We":[0],"tackle":[1],"the":[2,35,39,45,78,82,94,144,158],"problem":[3,24],"of":[4,25,84,131],"semantic":[5,19,41,133],"image":[6,15,47],"layout":[7,42,62,95,162],"manipulation,":[8],"which":[9],"aims":[10],"to":[11,30,38,72,77,110,117],"manipulate":[12],"an":[13],"input":[14,36],"by":[16],"editing":[17],"its":[18],"label":[20],"map.":[21],"A":[22],"core":[23],"this":[26,69,91],"task":[27],"is":[28],"how":[29],"transfer":[31,63],"visual":[32,108,122],"details":[33,75,109],"from":[34],"images":[37],"new":[40,111],"while":[43],"making":[44],"resulting":[46],"visually":[48],"realistic.":[49],"Recent":[50],"work":[51],"on":[52,87,143],"learning":[53],"cross-domain":[54],"correspondence":[55],"has":[56],"shown":[57],"promising":[58],"results":[59],"for":[60,93,139],"global":[61],"with":[64],"dense":[65],"attention-based":[66],"warping.":[67],"However,":[68],"method":[70],"tends":[71],"lose":[73],"texture":[74],"due":[76],"resolution":[79,115],"limitation":[80],"and":[81,135,146,161],"lack":[83],"smoothness":[85],"constraint":[86],"correspondence.":[88],"To":[89,119],"adapt":[90],"paradigm":[92],"manipulation":[96,163],"task,":[97],"we":[98,124],"propose":[99],"a":[100,114,126,132,136],"high-resolution":[101],"sparse":[102],"attention":[103],"module":[104],"that":[105,150],"effectively":[106],"transfers":[107],"layouts":[112],"at":[113],"up":[116],"512x512.":[118],"further":[120],"improve":[121],"quality,":[123],"introduce":[125],"novel":[127],"generator":[128],"architecture":[129],"consisting":[130],"encoder":[134],"two-stage":[137],"decoder":[138],"coarse-to-fine":[140],"synthesis.":[141],"Experiments":[142],"ADE20k":[145],"Places365":[147],"datasets":[148],"demonstrate":[149],"our":[151],"proposed":[152],"approach":[153],"achieves":[154],"substantial":[155],"improvements":[156],"over":[157],"existing":[159],"inpainting":[160],"methods.":[164]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
