{"id":"https://openalex.org/W7161704392","doi":"https://doi.org/10.48550/arxiv.2605.17527","title":"Designing streetscapes from street-view imagery using diffusion models","display_name":"Designing streetscapes from street-view imagery using diffusion models","publication_year":2026,"publication_date":"2026-05-17","ids":{"openalex":"https://openalex.org/W7161704392","doi":"https://doi.org/10.48550/arxiv.2605.17527"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.17527","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17527","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.17527","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009756467","display_name":"Yuzhou Chen","orcid":"https://orcid.org/0000-0002-1556-084X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yuzhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041224976","display_name":"Yuebing Liang","orcid":"https://orcid.org/0000-0003-2089-4606"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Yuebing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001267615","display_name":"Lingqian Hu","orcid":"https://orcid.org/0000-0002-5687-0764"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Lingqian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052099130","display_name":"Kailai Sun","orcid":"https://orcid.org/0000-0003-1648-3409"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Kailai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136490346","display_name":"Qingqi Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Qingqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029114955","display_name":"Chang Zhao","orcid":"https://orcid.org/0000-0002-5389-0479"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Chang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136471743","display_name":"Shenhao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Shenhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.3695000112056732,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.3695000112056732,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.09969999641180038,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10692","display_name":"Urban Green Space and Health","score":0.05810000002384186,"subfield":{"id":"https://openalex.org/subfields/2307","display_name":"Health, Toxicology and Mutagenesis"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5302000045776367},{"id":"https://openalex.org/keywords/urban-planning","display_name":"Urban planning","score":0.48019999265670776},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4693000018596649},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4684999883174896},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4611000120639801},{"id":"https://openalex.org/keywords/geospatial-analysis","display_name":"Geospatial analysis","score":0.4596000015735626},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.43790000677108765},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.4034000039100647}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.697700023651123},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5302000045776367},{"id":"https://openalex.org/C49545453","wikidata":"https://www.wikidata.org/wiki/Q69883","display_name":"Urban planning","level":2,"score":0.48019999265670776},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4693000018596649},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4684999883174896},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4611000120639801},{"id":"https://openalex.org/C9770341","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Geospatial analysis","level":2,"score":0.4596000015735626},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.43790000677108765},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4180999994277954},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.4034000039100647},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.4020000100135803},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.40049999952316284},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.34150001406669617},{"id":"https://openalex.org/C2777055276","wikidata":"https://www.wikidata.org/wiki/Q7936580","display_name":"Visual approach","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.3199999928474426},{"id":"https://openalex.org/C14669888","wikidata":"https://www.wikidata.org/wiki/Q4014850","display_name":"Creative visualization","level":3,"score":0.2806999981403351},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.27889999747276306},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2782999873161316},{"id":"https://openalex.org/C2778102629","wikidata":"https://www.wikidata.org/wiki/Q725252","display_name":"Satellite imagery","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.17527","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17527","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.17527","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17527","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities","score":0.82978355884552}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Street-view":[0],"imagery":[1,125,132,211],"(SVI)":[2],"is":[3,43],"widely":[4],"used":[5],"to":[6,128],"quantify":[7],"key":[8],"indicators":[9],"of":[10,36,81,103,223],"urban":[11,40,52,82,229,263],"environment,":[12],"such":[13,50],"as":[14,51,172,255],"green-":[15],"ery,":[16],"sky,":[17],"or":[18],"road":[19,98],"view":[20,187],"indices.":[21,188],"However,":[22],"existing":[23],"studies":[24],"largely":[25],"focus":[26],"on":[27,73],"measuring":[28],"current":[29],"streetscapes":[30,71],"and":[31,38,54,100,108,121,131,168,201,204,207,220,245,248,259],"rarely":[32],"support":[33],"the":[34,147,175,221],"generation":[35,190,241],"alternative":[37,70],"non-existing":[39],"scenarios,":[41],"which":[42],"a":[44,62,87,195,216,256],"core":[45],"task":[46],"in":[47,106,166,170,194],"geospatial":[48],"disciplines":[49],"planning":[53],"design.":[55],"To":[56],"address":[57],"this":[58,111,233],"gap,":[59],"we":[60,113],"propose":[61],"gener-":[63],"ative":[64],"multimodal":[65,88],"AI":[66,252],"framework":[67],"that":[68,90,115,138],"synthesizes":[69],"conditioned":[72],"targeted":[74],"visual":[75,79,104,140,156,200,208,226],"metrics,":[76],"enabling":[77],"direct":[78],"exploration":[80],"scenarios.":[83],"We":[84],"first":[85],"construct":[86],"dataset":[89],"aligns":[91],"SVIs":[92,244],"with":[93,178],"textual":[94,130,202,206],"descriptions,":[95],"segmentation":[96],"maps,":[97],"masks,":[99],"quantitative":[101,135],"metrics":[102],"elements":[105],"Chicago":[107],"Orlando.":[109],"Using":[110],"dataset,":[112],"demonstrate":[114],"diffusion":[116,246],"models":[117],"can":[118,142,191,253],"produce":[119],"realistic":[120],"semantically":[122],"consistent":[123],"streetscape":[124,240],"while":[126,153],"responding":[127],"both":[129,199],"controls.":[133],"Our":[134],"evaluations":[136],"show":[137],"incorporating":[139],"controls":[141,209,212,227],"improve":[143],"semantic":[144,161],"consistency,":[145],"reducing":[146],"LPIPS":[148],"index":[149],"by":[150,164,174,198],"approximately":[151],"6%":[152],"maintaining":[154],"global":[155],"realism.":[157],"In":[158],"addition,":[159],"overall":[160],"consistency":[162],"increases":[163],"23.7%":[165],"Orlando":[167],"46.4%":[169],"Chicago,":[171],"measured":[173],"mIoU":[176],"index,":[177],"class-wise":[179],"gains":[180],"exceeding":[181],"even":[182],"100%":[183],"improvement":[184],"for":[185,228,239,262],"building":[186],"Streetscape":[189],"be":[192],"controlled":[193],"fine-grained":[196],"manner":[197],"prompts,":[203],"when":[205],"conflict,":[210],"consistently":[213],"dominate,":[214],"indicating":[215],"clear":[217],"control":[218],"hierarchy":[219],"importance":[222],"further":[224],"developing":[225],"scene":[230],"generation.":[231],"Overall,":[232],"work":[234],"establishes":[235],"an":[236],"important":[237],"benchmark":[238],"us-":[242],"ing":[243],"models,":[247],"illustrates":[249],"how":[250],"generative":[251],"serve":[254],"practical,":[257],"scalable,":[258],"controllable":[260],"approach":[261],"scenario":[264],"exploration.":[265]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
