{"id":"https://openalex.org/W4385301582","doi":"https://doi.org/10.1109/iv55152.2023.10186698","title":"Urban-StyleGAN: Learning to Generate and Manipulate Images of Urban Scenes","display_name":"Urban-StyleGAN: Learning to Generate and Manipulate Images of Urban Scenes","publication_year":2023,"publication_date":"2023-06-04","ids":{"openalex":"https://openalex.org/W4385301582","doi":"https://doi.org/10.1109/iv55152.2023.10186698"},"language":"en","primary_location":{"id":"doi:10.1109/iv55152.2023.10186698","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/iv55152.2023.10186698","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Intelligent Vehicles Symposium (IV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049254859","display_name":"George Eskandar","orcid":"https://orcid.org/0000-0002-8099-8717"},"institutions":[{"id":"https://openalex.org/I100066346","display_name":"University of Stuttgart","ror":"https://ror.org/04vnq7t77","country_code":"DE","type":"education","lineage":["https://openalex.org/I100066346"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"George Eskandar","raw_affiliation_strings":["University of Stuttgart,Germany","University of Stuttgart, Germany"],"affiliations":[{"raw_affiliation_string":"University of Stuttgart,Germany","institution_ids":["https://openalex.org/I100066346"]},{"raw_affiliation_string":"University of Stuttgart, Germany","institution_ids":["https://openalex.org/I100066346"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040257052","display_name":"Youssef Farag","orcid":"https://orcid.org/0000-0003-0106-8456"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Youssef Farag","raw_affiliation_strings":["Technical University of Munich (TUM),Germany","Technical University of Munich (TUM), Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Munich (TUM),Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Technical University of Munich (TUM), Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034841183","display_name":"Tarun Yenamandra","orcid":null},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tarun Yenamandra","raw_affiliation_strings":["Technical University of Munich (TUM),Germany","Technical University of Munich (TUM), Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Munich (TUM),Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Technical University of Munich (TUM), Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087710605","display_name":"Daniel Cremers","orcid":"https://orcid.org/0000-0002-3079-7984"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Daniel Cremers","raw_affiliation_strings":["Technical University of Munich (TUM),Germany","Technical University of Munich (TUM), Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Munich (TUM),Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Technical University of Munich (TUM), Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044253600","display_name":"Karim Guirguis","orcid":null},"institutions":[{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Karim Guirguis","raw_affiliation_strings":["Bosch Center for Artificial Intelligence,Renningen,Germany","Bosch Center for Artificial Intelligence, Renningen, Germany"],"affiliations":[{"raw_affiliation_string":"Bosch Center for Artificial Intelligence,Renningen,Germany","institution_ids":["https://openalex.org/I889804353"]},{"raw_affiliation_string":"Bosch Center for Artificial Intelligence, Renningen, Germany","institution_ids":["https://openalex.org/I889804353"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101717968","display_name":"Bin Yang","orcid":"https://orcid.org/0000-0002-8322-117X"},"institutions":[{"id":"https://openalex.org/I100066346","display_name":"University of Stuttgart","ror":"https://ror.org/04vnq7t77","country_code":"DE","type":"education","lineage":["https://openalex.org/I100066346"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bin Yang","raw_affiliation_strings":["University of Stuttgart,Germany","University of Stuttgart, Germany"],"affiliations":[{"raw_affiliation_string":"University of Stuttgart,Germany","institution_ids":["https://openalex.org/I100066346"]},{"raw_affiliation_string":"University of Stuttgart, Germany","institution_ids":["https://openalex.org/I100066346"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5049254859"],"corresponding_institution_ids":["https://openalex.org/I100066346"],"apc_list":null,"apc_paid":null,"fwci":0.5943,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.68637864,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9297999739646912,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9189000129699707,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7229475975036621},{"id":"https://openalex.org/keywords/controllability","display_name":"Controllability","score":0.6716760396957397},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.6500890254974365},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6364665031433105},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6315017342567444},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5865593552589417},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5380911231040955},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5210092067718506},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.5136520266532898},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5050278306007385},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.48433101177215576},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4635635316371918},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4465409219264984},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4104645550251007},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35955846309661865},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1451522707939148},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.07642918825149536}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7229475975036621},{"id":"https://openalex.org/C48209547","wikidata":"https://www.wikidata.org/wiki/Q1331104","display_name":"Controllability","level":2,"score":0.6716760396957397},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.6500890254974365},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6364665031433105},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6315017342567444},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5865593552589417},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5380911231040955},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5210092067718506},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.5136520266532898},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5050278306007385},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.48433101177215576},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4635635316371918},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4465409219264984},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4104645550251007},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35955846309661865},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1451522707939148},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.07642918825149536},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iv55152.2023.10186698","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/iv55152.2023.10186698","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Intelligent Vehicles Symposium (IV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W2340897893","https://openalex.org/W2487365028","https://openalex.org/W2630837129","https://openalex.org/W2781228439","https://openalex.org/W2785678896","https://openalex.org/W2804078698","https://openalex.org/W2962770929","https://openalex.org/W2962974533","https://openalex.org/W2963800363","https://openalex.org/W2981017910","https://openalex.org/W3014852036","https://openalex.org/W3034371424","https://openalex.org/W3034431451","https://openalex.org/W3035574324","https://openalex.org/W3047371217","https://openalex.org/W3107847401","https://openalex.org/W3112587064","https://openalex.org/W3118552741","https://openalex.org/W3121736286","https://openalex.org/W3174807077","https://openalex.org/W3175549255","https://openalex.org/W3177221875","https://openalex.org/W3180355996","https://openalex.org/W4200630668","https://openalex.org/W4213186350","https://openalex.org/W4214897085","https://openalex.org/W4214926101","https://openalex.org/W4285981784","https://openalex.org/W4286869901","https://openalex.org/W4287817254","https://openalex.org/W4288018050","https://openalex.org/W4294643831","https://openalex.org/W4295719664","https://openalex.org/W4313499710","https://openalex.org/W4320013936","https://openalex.org/W6745935785","https://openalex.org/W6752378368","https://openalex.org/W6767457696","https://openalex.org/W6788340828","https://openalex.org/W6788482648","https://openalex.org/W6797179183","https://openalex.org/W6803132585"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3005996785","https://openalex.org/W3014948380","https://openalex.org/W4386984417","https://openalex.org/W4210468674","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4395044357","https://openalex.org/W4287117424","https://openalex.org/W4387506531"],"abstract_inverted_index":{"A":[0,62],"promise":[1],"of":[2,59,65,71,83,120,168,227],"Generative":[3],"Adversarial":[4],"Networks":[5],"(GANs)":[6],"is":[7,34,68,175,215],"to":[8,45,123],"provide":[9,136],"cheap":[10],"photorealistic":[11],"data":[12],"for":[13,75,108],"training":[14],"and":[15,112,171,193,204,214],"validating":[16],"AI":[17],"models":[18,222],"in":[19,98,165,184,225],"autonomous":[20],"driving.":[21],"Despite":[22],"their":[23,26],"huge":[24],"success,":[25],"performance":[27],"on":[28,94,190,211,216],"complex":[29,131],"images":[30],"featuring":[31],"multiple":[32],"objects":[33],"understudied.":[35],"While":[36],"some":[37],"frameworks":[38],"produce":[39],"high-quality":[40,60],"street":[41],"scenes":[42,128,213],"with":[43,218],"little":[44],"no":[46],"control":[47,55],"over":[48],"the":[49,57,69,76,81,166,169,179,186,191,197],"image":[50,187,206],"content,":[51],"others":[52],"offer":[53],"more":[54,130,138,176,202],"at":[56],"expense":[58],"generation.":[61],"common":[63],"limitation":[64],"both":[66],"approaches":[67,210],"use":[70],"global":[72],"latent":[73,95,142,162],"codes":[74],"whole":[77],"image,":[78],"which":[79],"hinders":[80],"learning":[82],"independent":[84],"object":[85],"distributions.":[86],"Motivated":[87],"by":[88],"SemanticStyleGAN":[89],"(SSG),":[90],"a":[91,104,117,137,146],"recent":[92],"work":[93],"space":[96],"disentanglement":[97],"human":[99,133],"face":[100],"generation,":[101],"we":[102,144,158],"propose":[103],"novel":[105],"framework,":[106],"Urban-StyleGAN,":[107],"urban":[109,127,212],"scene":[110],"generation":[111],"manipulation.":[113],"We":[114],"find":[115],"that":[116,173],"straightforward":[118],"application":[119],"SSG":[121],"leads":[122],"poor":[124],"results":[125],"because":[126],"are":[129,153],"than":[132,178,208],"faces.":[134],"To":[135],"compact":[139],"yet":[140],"disentangled":[141],"representation,":[143],"develop":[145],"class":[147],"grouping":[148],"strategy":[149],"wherein":[150],"individual":[151],"classes":[152],"grouped":[154],"into":[155],"super-classes.":[156],"Moreover,":[157],"employ":[159],"an":[160],"unsupervised":[161],"exploration":[163],"algorithm":[164],"$\\mathcal{S}$-space":[167],"generator":[170],"show":[172,196],"it":[174],"efficient":[177],"conventional":[180],"${\\mathcal{W}^":[181],"+":[182],"}$-space":[183],"controlling":[185],"content.":[188],"Results":[189],"Cityscapes":[192],"Mapillary":[194],"datasets":[195],"proposed":[198],"approach":[199],"achieves":[200],"significantly":[201],"controllability":[203],"improved":[205],"quality":[207],"previous":[209],"par":[217],"general-purpose":[219],"non-controllable":[220],"generative":[221],"(like":[223],"StyleGAN2)":[224],"terms":[226],"quality.":[228]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
