{"id":"https://openalex.org/W7154719851","doi":"https://doi.org/10.48550/arxiv.2604.14302","title":"Geometrically Consistent Multi-View Scene Generation from Freehand Sketches","display_name":"Geometrically Consistent Multi-View Scene Generation from Freehand Sketches","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154719851","doi":"https://doi.org/10.48550/arxiv.2604.14302"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.14302","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14302","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.14302","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114111694","display_name":"Ahmed Bourouis","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bourouis, Ahmed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133891358","display_name":"Savas Ozkan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ozkan, Savas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068052561","display_name":"Andrea Maracani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maracani, Andrea","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133907505","display_name":"Yi-Zhe Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yi-Zhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133828449","display_name":"Mete Ozay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ozay, Mete","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5114111694"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.41920000314712524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.41920000314712524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.23649999499320984,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.1429000049829483,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.632099986076355},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5724999904632568},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5627999901771545},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.3889000117778778},{"id":"https://openalex.org/keywords/iterative-and-incremental-development","display_name":"Iterative and incremental development","score":0.3711000084877014},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.31700000166893005}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6991000175476074},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6363000273704529},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.632099986076355},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.609000027179718},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5724999904632568},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5627999901771545},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.3889000117778778},{"id":"https://openalex.org/C143587482","wikidata":"https://www.wikidata.org/wiki/Q1543216","display_name":"Iterative and incremental development","level":2,"score":0.3711000084877014},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C543847140","wikidata":"https://www.wikidata.org/wiki/Q2642826","display_name":"Realism","level":2,"score":0.2985999882221222},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2782000005245209},{"id":"https://openalex.org/C32990609","wikidata":"https://www.wikidata.org/wiki/Q306542","display_name":"Transformation geometry","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.26570001244544983},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.26019999384880066}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.14302","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14302","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.14302","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14302","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,70],"tackle":[1],"a":[2,11,26,96,128,144,180],"new":[3],"problem:":[4],"generating":[5],"geometrically":[6,20],"consistent":[7,45],"multi-view":[8,27,54],"scenes":[9],"from":[10,83,135],"single":[12,145],"freehand":[13],"sketch.":[14],"Freehand":[15],"sketches":[16],"are":[17],"the":[18,78,123],"most":[19],"impoverished":[21],"input":[22],"one":[23],"could":[24],"offer":[25],"generator.":[28],"They":[29],"convey":[30],"scene":[31],"intent":[32],"through":[33,90],"abstract":[34],"strokes":[35],"while":[36,60,176],"introducing":[37],"spatial":[38],"distortions":[39],"that":[40,117],"actively":[41],"conflict":[42],"with":[43],"any":[44],"3D":[46],"interpretation.":[47],"No":[48],"prior":[49],"method":[50],"attempts":[51],"this;":[52],"existing":[53],"approaches":[55],"require":[56],"photographs":[57],"or":[58,66,154],"text,":[59],"sketch-to-3D":[61],"methods":[62],"need":[63,79],"multiple":[64],"views":[65,142],"costly":[67],"per-scene":[68,155],"optimisation.":[69],"address":[71],"three":[72,91],"compounding":[73],"challenges;":[74],"absent":[75],"training":[76],"data,":[77],"for":[80],"geometric":[81,119,171],"reasoning":[82],"distorted":[84],"2D":[85],"input,":[86],"and":[87,108,126,170],"cross-view":[88],"consistency,":[89],"mutually":[92],"reinforcing":[93],"contributions:":[94],"(i)":[95],"curated":[97],"dataset":[98],"of":[99],"$\\sim$9k":[100],"sketch-to-multiview":[101],"samples,":[102],"constructed":[103],"via":[104],"an":[105],"automated":[106],"generation":[107],"filtering":[109],"pipeline;":[110],"(ii)":[111],"Parallel":[112],"Camera-Aware":[113],"Attention":[114],"Adapters":[115],"(CA3)":[116],"inject":[118],"inductive":[120],"biases":[121],"into":[122],"video":[124],"transformer;":[125],"(iii)":[127],"Sparse":[129],"Correspondence":[130],"Supervision":[131],"Loss":[132],"(CSL)":[133],"derived":[134],"Structure-from-Motion":[136],"reconstructions.":[137],"Our":[138,157],"framework":[139],"synthesizes":[140],"all":[141],"in":[143],"denoising":[146],"process":[147],"without":[148],"requiring":[149],"reference":[150],"images,":[151],"iterative":[152],"refinement,":[153],"optimization.":[156],"approach":[158],"significantly":[159],"outperforms":[160],"state-of-the-art":[161],"two-stage":[162],"baselines,":[163],"improving":[164],"realism":[165],"(FID)":[166],"by":[167,174],"over":[168],"60%":[169],"consistency":[172],"(Corr-Acc)":[173],"23%,":[175],"providing":[177],"up":[178],"to":[179],"3.7$\\times$":[181],"inference":[182],"speedup.":[183]},"counts_by_year":[],"updated_date":"2026-04-18T06:05:20.339008","created_date":"2026-04-18T00:00:00"}
