{"id":"https://openalex.org/W7154188911","doi":"https://doi.org/10.1145/3772318.3790870","title":"SoundStager: Interactive Design of Story-Driven GenAI Soundscapes for Video","display_name":"SoundStager: Interactive Design of Story-Driven GenAI Soundscapes for Video","publication_year":2026,"publication_date":"2026-04-13","ids":{"openalex":"https://openalex.org/W7154188911","doi":"https://doi.org/10.1145/3772318.3790870"},"language":null,"primary_location":{"id":"doi:10.1145/3772318.3790870","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3772318.3790870","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3772318.3790870","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087116106","display_name":"Suhyeon Yoo","orcid":"https://orcid.org/0000-0001-6098-9947"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Suhyeon Yoo","raw_affiliation_strings":["Computer Science, University of Toronto, Toronto, Ontario, Canada"],"raw_orcid":"https://orcid.org/0000-0001-6098-9947","affiliations":[{"raw_affiliation_string":"Computer Science, University of Toronto, Toronto, Ontario, Canada","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133532924","display_name":"Adolfo Hernandez Santisteban","orcid":"https://orcid.org/0009-0001-4545-1441"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Adolfo Hernandez Santisteban","raw_affiliation_strings":["Adobe, Seattle, Washington, USA"],"raw_orcid":"https://orcid.org/0009-0001-4545-1441","affiliations":[{"raw_affiliation_string":"Adobe, Seattle, Washington, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023673004","display_name":"Prem Seetharaman","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Prem Seetharaman","raw_affiliation_strings":["Adobe Research, Sacramento, California, USA"],"raw_orcid":"https://orcid.org/0009-0008-9813-0992","affiliations":[{"raw_affiliation_string":"Adobe Research, Sacramento, California, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037548450","display_name":"Justin Salamon","orcid":"https://orcid.org/0000-0001-6345-4593"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Justin Salamon","raw_affiliation_strings":["Adobe Research, San Francisco, California, USA"],"raw_orcid":"https://orcid.org/0000-0001-6345-4593","affiliations":[{"raw_affiliation_string":"Adobe Research, San Francisco, California, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110542743","display_name":"Oriol Nieto","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oriol Nieto","raw_affiliation_strings":["Adobe Research, San Francisco, California, USA"],"raw_orcid":"https://orcid.org/0000-0001-6459-7609","affiliations":[{"raw_affiliation_string":"Adobe Research, San Francisco, California, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5097660143","display_name":"Anh Truong","orcid":"https://orcid.org/0009-0005-5409-7287"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anh Truong","raw_affiliation_strings":["Adobe Research, New York, New York, USA"],"raw_orcid":"https://orcid.org/0009-0005-5409-7287","affiliations":[{"raw_affiliation_string":"Adobe Research, New York, New York, USA","institution_ids":["https://openalex.org/I1306409833"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53332536,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.4140999913215637,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.4140999913215637,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10803","display_name":"Innovative Human-Technology Interaction","score":0.179299995303154,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.10849999636411667,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/soundscape","display_name":"Soundscape","score":0.9258000254631042},{"id":"https://openalex.org/keywords/sound-design","display_name":"Sound design","score":0.6432999968528748},{"id":"https://openalex.org/keywords/formative-assessment","display_name":"Formative assessment","score":0.5723999738693237},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5716999769210815},{"id":"https://openalex.org/keywords/interactive-storytelling","display_name":"Interactive storytelling","score":0.5080999732017517},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.48660001158714294},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.4763000011444092},{"id":"https://openalex.org/keywords/storytelling","display_name":"Storytelling","score":0.4690999984741211}],"concepts":[{"id":"https://openalex.org/C142795923","wikidata":"https://www.wikidata.org/wiki/Q1358257","display_name":"Soundscape","level":3,"score":0.9258000254631042},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6524999737739563},{"id":"https://openalex.org/C499572226","wikidata":"https://www.wikidata.org/wiki/Q1937950","display_name":"Sound design","level":3,"score":0.6432999968528748},{"id":"https://openalex.org/C42525527","wikidata":"https://www.wikidata.org/wiki/Q1209955","display_name":"Formative assessment","level":2,"score":0.5723999738693237},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5716999769210815},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.510200023651123},{"id":"https://openalex.org/C2779754051","wikidata":"https://www.wikidata.org/wiki/Q2903135","display_name":"Interactive storytelling","level":4,"score":0.5080999732017517},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5072000026702881},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.48660001158714294},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.4763000011444092},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.4690999984741211},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.3637999892234802},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.33500000834465027},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3294999897480011},{"id":"https://openalex.org/C13854087","wikidata":"https://www.wikidata.org/wiki/Q1061656","display_name":"Interaction design","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C2776566319","wikidata":"https://www.wikidata.org/wiki/Q3495514","display_name":"Interactive video","level":2,"score":0.2883000075817108},{"id":"https://openalex.org/C203004452","wikidata":"https://www.wikidata.org/wiki/Q1186952","display_name":"Interactive media","level":2,"score":0.28209999203681946},{"id":"https://openalex.org/C106246047","wikidata":"https://www.wikidata.org/wiki/Q4928435","display_name":"Iterative design","level":3,"score":0.2615000009536743},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.25440001487731934},{"id":"https://openalex.org/C2780544925","wikidata":"https://www.wikidata.org/wiki/Q569874","display_name":"Surround sound","level":3,"score":0.25360000133514404},{"id":"https://openalex.org/C33276779","wikidata":"https://www.wikidata.org/wiki/Q1943363","display_name":"Design elements and principles","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3772318.3790870","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3772318.3790870","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3772318.3790870","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3772318.3790870","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W1493418801","https://openalex.org/W2058733260","https://openalex.org/W2065211088","https://openalex.org/W2078118823","https://openalex.org/W2121277371","https://openalex.org/W2537196324","https://openalex.org/W2602896535","https://openalex.org/W2737697117","https://openalex.org/W2794878841","https://openalex.org/W2913752531","https://openalex.org/W2950504429","https://openalex.org/W2963807156","https://openalex.org/W3007605881","https://openalex.org/W3016916278","https://openalex.org/W3031000691","https://openalex.org/W3046890131","https://openalex.org/W3093732029","https://openalex.org/W3187009280","https://openalex.org/W4225126561","https://openalex.org/W4247639588","https://openalex.org/W4285051996","https://openalex.org/W4297536219","https://openalex.org/W4307475423","https://openalex.org/W4309618065","https://openalex.org/W4360991782","https://openalex.org/W4367359628","https://openalex.org/W4386071828","https://openalex.org/W4386076291","https://openalex.org/W4387801088","https://openalex.org/W4392909615","https://openalex.org/W4395443690","https://openalex.org/W4396832253","https://openalex.org/W4396833556","https://openalex.org/W4402111756","https://openalex.org/W4403653559","https://openalex.org/W4403791239","https://openalex.org/W4403791956","https://openalex.org/W4404037650","https://openalex.org/W4408352247","https://openalex.org/W4408573818","https://openalex.org/W4408860855","https://openalex.org/W4409364205","https://openalex.org/W4409367203","https://openalex.org/W4409720701","https://openalex.org/W4409735460","https://openalex.org/W4409736191","https://openalex.org/W4409746660","https://openalex.org/W4409749602","https://openalex.org/W4409888070","https://openalex.org/W4410857264","https://openalex.org/W4412035836","https://openalex.org/W4413144830","https://openalex.org/W4413720412","https://openalex.org/W7084094831"],"related_works":[],"abstract_inverted_index":{"Sound":[0],"effects":[1],"(SFX)":[2],"are":[3],"critical":[4],"to":[5,27,34,43,51,82,139],"video":[6,80,119,132],"storytelling":[7],"by":[8,110],"immersing":[9],"viewers,":[10],"directing":[11],"attention,":[12],"and":[13,31,56,91,94,103,121],"shaping":[14],"emotion.":[15],"However,":[16],"crafting":[17],"an":[18,68],"effective":[19],"soundscape":[20],"is":[21],"difficult:":[22],"creators":[23,48,133],"must":[24],"decide":[25],"how":[26],"source,":[28],"place,":[29],"layer,":[30],"mix":[32],"sounds":[33,53],"support":[35],"the":[36,79],"narrative.":[37],"Generative":[38],"text-to-SFX":[39],"tools":[40],"enable":[41],"users":[42,138],"create":[44,83,141],"custom":[45],"sounds,":[46],"but":[47],"often":[49],"struggle":[50],"describe":[52],"with":[54,113,130],"words":[55],"lack":[57],"control":[58],"over":[59],"individual":[60],"stems":[61],"in":[62],"premixed":[63],"outputs.":[64],"We":[65],"propose":[66],"SoundStager,":[67],"AI-assisted":[69],"tool":[70],"for":[71,75],"designing":[72],"generative":[73],"soundscapes":[74,143],"video.":[76],"SoundStager":[77,136],"analyzes":[78],"narrative":[81],"layered":[84],"audio":[85],"scenes":[86],"(of":[87],"keynote,":[88],"signal,":[89],"soundmark,":[90],"archetypal":[92],"sounds)":[93],"supports":[95],"iterative":[96],"refinement":[97],"through":[98],"a":[99],"combination":[100],"of":[101],"conversational":[102],"analog":[104],"controls.":[105],"SoundStager\u2019s":[106],"design":[107,125],"was":[108],"informed":[109],"formative":[111],"studies":[112],"six":[114,118],"professional":[115],"sound":[116,124],"designers,":[117],"creators,":[120],"insights":[122],"from":[123],"literature.":[126],"Our":[127],"user":[128],"evaluation":[129],"twelve":[131],"shows":[134],"that":[135],"enables":[137],"quickly":[140],"satisfactory":[142],"while":[144],"retaining":[145],"creative":[146],"control.":[147]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-14T00:00:00"}
