{"id":"https://openalex.org/W4412985088","doi":"https://doi.org/10.1109/tpami.2025.3595880","title":"InstructLayout: Instruction-Driven 2D and 3D Layout Synthesis With Semantic Graph Prior","display_name":"InstructLayout: Instruction-Driven 2D and 3D Layout Synthesis With Semantic Graph Prior","publication_year":2025,"publication_date":"2025-08-05","ids":{"openalex":"https://openalex.org/W4412985088","doi":"https://doi.org/10.1109/tpami.2025.3595880","pmid":"https://pubmed.ncbi.nlm.nih.gov/40763054"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3595880","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3595880","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101179369","display_name":"Chenguo Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenguo Lin","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University, Beijing, China","Wangxuan Institute of Computer Technology, Peking University, China"],"raw_orcid":"https://orcid.org/0000-0002-6872-7471","affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101961542","display_name":"Yu-Chen Lin","orcid":"https://orcid.org/0009-0006-0144-6700"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuchen Lin","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University, Beijing, China","Wangxuan Institute of Computer Technology, Peking University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099381065","display_name":"Panwang Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I6507939","display_name":"China United Network Communications Group (China)","ror":"https://ror.org/028w99c90","country_code":"CN","type":"company","lineage":["https://openalex.org/I6507939"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Panwang Pan","raw_affiliation_strings":["PICO AI Group, ByteDance, Beijing, China","PICO AI group, ByteDance, China"],"raw_orcid":"https://orcid.org/0000-0001-8631-012X","affiliations":[{"raw_affiliation_string":"PICO AI Group, ByteDance, Beijing, China","institution_ids":["https://openalex.org/I6507939"]},{"raw_affiliation_string":"PICO AI group, ByteDance, China","institution_ids":["https://openalex.org/I6507939"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041793389","display_name":"Xuanyang Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I6507939","display_name":"China United Network Communications Group (China)","ror":"https://ror.org/028w99c90","country_code":"CN","type":"company","lineage":["https://openalex.org/I6507939"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuanyang Zhang","raw_affiliation_strings":["PICO AI Group, ByteDance, Beijing, China","PICO AI group, ByteDance, China"],"raw_orcid":"https://orcid.org/0000-0001-5092-8657","affiliations":[{"raw_affiliation_string":"PICO AI Group, ByteDance, Beijing, China","institution_ids":["https://openalex.org/I6507939"]},{"raw_affiliation_string":"PICO AI group, ByteDance, China","institution_ids":["https://openalex.org/I6507939"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028877572","display_name":"Yadong Mu","orcid":"https://orcid.org/0000-0001-7815-3750"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yadong Mu","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University, Beijing, China","Wangxuan Institute of Computer Technology, Peking University, China"],"raw_orcid":"https://orcid.org/0000-0001-7815-3750","affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.9045,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.78543941,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"47","issue":"12","first_page":"11040","last_page":"11050"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.9768999814987183,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7477964162826538},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5462051630020142},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.49178197979927063},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46386924386024475},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35201990604400635},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.33101457357406616},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3302878737449646}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7477964162826538},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5462051630020142},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.49178197979927063},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46386924386024475},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35201990604400635},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33101457357406616},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3302878737449646}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3595880","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3595880","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:40763054","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40763054","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W2326925005","https://openalex.org/W2760103357","https://openalex.org/W2798622261","https://openalex.org/W2949924544","https://openalex.org/W2960202457","https://openalex.org/W2963184176","https://openalex.org/W2963601843","https://openalex.org/W2964334375","https://openalex.org/W2990222759","https://openalex.org/W3000176874","https://openalex.org/W3016025127","https://openalex.org/W3035108870","https://openalex.org/W3095066959","https://openalex.org/W3190835409","https://openalex.org/W3195692323","https://openalex.org/W3199003182","https://openalex.org/W3202536355","https://openalex.org/W3204757729","https://openalex.org/W4205481600","https://openalex.org/W4214625308","https://openalex.org/W4214755412","https://openalex.org/W4214778243","https://openalex.org/W4285605355","https://openalex.org/W4289436753","https://openalex.org/W4304080663","https://openalex.org/W4312388283","https://openalex.org/W4317033447","https://openalex.org/W4385245566","https://openalex.org/W4385572884","https://openalex.org/W4386071540","https://openalex.org/W4386071617","https://openalex.org/W4386071810","https://openalex.org/W4386076211","https://openalex.org/W4386607324","https://openalex.org/W4387967982","https://openalex.org/W4387968707","https://openalex.org/W4389298345","https://openalex.org/W4390874211","https://openalex.org/W4402753875","https://openalex.org/W4413147469"],"related_works":["https://openalex.org/W4213212078","https://openalex.org/W2187227032","https://openalex.org/W2112788825","https://openalex.org/W1921169094","https://openalex.org/W1963735073","https://openalex.org/W4233129888","https://openalex.org/W366410996","https://openalex.org/W106707639","https://openalex.org/W2793742470","https://openalex.org/W2146247781"],"abstract_inverted_index":{"Comprehending":[0],"natural":[1],"language":[2,106],"instructions":[3],"is":[4],"a":[5,33,39,44,77,123],"charming":[6],"property":[7],"for":[8,52,84],"both":[9,127],"2D":[10,53,86,128],"and":[11,23,43,50,54,66,87,107,129],"3D":[12,55,88,130],"layout":[13,45,56,64,131],"synthesis":[14,132],"systems.":[15],"Existing":[16],"methods":[17],"implicitly":[18],"model":[19],"object":[20,25,67],"joint":[21],"distributions":[22,68],"express":[24],"relations,":[26],"hindering":[27],"generation's":[28],"controllability.":[29],"We":[30],"introduce":[31],"InstructLayout,":[32],"novel":[34],"generative":[35],"framework":[36],"that":[37,114],"integrates":[38],"semantic":[40,60],"graph":[41,61],"prior":[42,62],"decoder":[46],"to":[47],"improve":[48],"controllability":[49],"fidelity":[51],"synthesis.":[57],"The":[58],"proposed":[59,116],"learns":[63],"appearances":[65],"simultaneously,":[69],"demonstrating":[70],"versatility":[71],"across":[72],"various":[73],"downstream":[74],"tasks":[75],"in":[76,126],"zero-shot":[78],"manner.":[79],"To":[80],"facilitate":[81],"the":[82,115,138],"benchmarking":[83],"text-driven":[85],"scene":[89],"synthesis,":[90],"we":[91],"respectively":[92],"curate":[93],"two":[94],"high-quality":[95],"datasets":[96],"of":[97,140],"layout-instruction":[98],"pairs":[99],"from":[100],"public":[101],"Internet":[102],"resources":[103],"with":[104],"large":[105,124],"multimodal":[108],"models.":[109],"Extensive":[110],"experimental":[111],"results":[112],"reveal":[113],"method":[117],"outperforms":[118],"existing":[119],"state-of-the-art":[120],"approaches":[121],"by":[122],"margin":[125],"tasks.":[133],"Thorough":[134],"ablation":[135],"studies":[136],"confirm":[137],"efficacy":[139],"crucial":[141],"design":[142],"components.":[143]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
