{"id":"https://openalex.org/W7133314614","doi":"https://doi.org/10.48550/arxiv.2603.00395","title":"Fine-grained Soundscape Control for Augmented Hearing","display_name":"Fine-grained Soundscape Control for Augmented Hearing","publication_year":2026,"publication_date":"2026-02-28","ids":{"openalex":"https://openalex.org/W7133314614","doi":"https://doi.org/10.48550/arxiv.2603.00395"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.00395","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00395","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.00395","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127969858","display_name":"Seunghyun Oh","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Oh, Seunghyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035670633","display_name":"Malek Itani","orcid":"https://orcid.org/0009-0002-7249-2641"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Itani, Malek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127908083","display_name":"Aseem Gauri","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gauri, Aseem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5011077730","display_name":"Shyamnath Gollakota","orcid":"https://orcid.org/0000-0002-9863-3054"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gollakota, Shyamnath","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5127969858"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.4950000047683716,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.4950000047683716,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.41620001196861267,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.025699999183416367,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/soundscape","display_name":"Soundscape","score":0.9059000015258789},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6133999824523926},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5026999711990356},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.47540000081062317},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.47279998660087585},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.4041999876499176},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.3944000005722046},{"id":"https://openalex.org/keywords/noise-control","display_name":"Noise control","score":0.3677999973297119}],"concepts":[{"id":"https://openalex.org/C142795923","wikidata":"https://www.wikidata.org/wiki/Q1358257","display_name":"Soundscape","level":3,"score":0.9059000015258789},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6854000091552734},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6133999824523926},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5246999859809875},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5026999711990356},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.47540000081062317},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.47279998660087585},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4041999876499176},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.3944000005722046},{"id":"https://openalex.org/C116822448","wikidata":"https://www.wikidata.org/wiki/Q1879301","display_name":"Noise control","level":3,"score":0.3677999973297119},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.34310001134872437},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.32519999146461487},{"id":"https://openalex.org/C98025372","wikidata":"https://www.wikidata.org/wiki/Q477538","display_name":"Systems architecture","level":3,"score":0.3228999972343445},{"id":"https://openalex.org/C100675267","wikidata":"https://www.wikidata.org/wiki/Q1371624","display_name":"Background noise","level":2,"score":0.3122999966144562},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.3077000081539154},{"id":"https://openalex.org/C205312793","wikidata":"https://www.wikidata.org/wiki/Q16002801","display_name":"Ambient noise level","level":3,"score":0.2962000072002411},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.2906000018119812},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2782000005245209},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.27630001306533813},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.25209999084472656},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.00395","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00395","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.00395","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00395","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Hearables":[0],"are":[1],"becoming":[2],"ubiquitous,":[3],"yet":[4],"their":[5,99],"sound":[6,68,146],"controls":[7],"remain":[8],"blunt:":[9],"users":[10,33,97],"can":[11],"either":[12],"enable":[13],"global":[14],"noise":[15],"suppression":[16],"or":[17],"focus":[18],"on":[19,51,125],"a":[20,61,72,169],"single":[21],"target":[22,93],"sound.":[23],"Real-world":[24],"acoustic":[25],"scenes,":[26],"however,":[27],"contain":[28],"many":[29],"simultaneous":[30],"sources":[31],"that":[32,64,78,161],"may":[34],"want":[35],"to":[36,45],"adjust":[37],"independently.":[38],"We":[39,112],"introduce":[40],"Aurchestra,":[41,174],"the":[42,114,162,175],"first":[43],"system":[44,55,142],"provide":[46],"fine-grained,":[47],"real-time":[48,123],"soundscape":[49,176],"control":[50,147],"resource-constrained":[52],"hearables.":[53],"Our":[54,158],"has":[56],"two":[57],"key":[58],"components:":[59],"(1)":[60],"dynamic":[62],"interface":[63],"surfaces":[65],"only":[66],"active":[67],"classes":[69],"and":[70,95,121,138,148,155],"(2)":[71],"real-time,":[73],"on-device":[74],"multi-output":[75],"extraction":[76],"network":[77],"generates":[79],"separate":[80],"streams":[81],"for":[82,89,117],"each":[83],"selected":[84],"class,":[85],"achieving":[86],"robust":[87],"performance":[88,124],"upto":[90],"5":[91],"overlapping":[92],"sounds,":[94],"letting":[96],"mix":[98],"environment":[100],"by":[101],"customizing":[102],"per-class":[103,145],"volumes,":[104],"much":[105],"like":[106],"an":[107],"audio":[108,129],"engineer":[109],"mixes":[110],"tracks.":[111],"optimize":[113],"model":[115],"architecture":[116],"multiple":[118],"compute-limited":[119],"platforms":[120],"demonstrate":[122],"6":[126],"ms":[127],"streaming":[128],"chunks.":[130],"Across":[131],"real-world":[132],"environments":[133],"in":[134,152],"previously":[135],"unseen":[136],"indoor":[137],"outdoor":[139],"scenarios,":[140],"our":[141],"enables":[143],"expressive":[144],"achieves":[149],"substantial":[150],"improvements":[151],"target-class":[153],"enhancement":[154],"interference":[156],"suppression.":[157],"results":[159],"show":[160],"world":[163],"need":[164],"not":[165],"be":[166],"heard":[167],"as":[168],"single,":[170],"undifferentiated":[171],"stream:":[172],"with":[173],"becomes":[177],"truly":[178],"programmable.":[179]},"counts_by_year":[],"updated_date":"2026-03-07T13:37:22.277990","created_date":"2026-03-04T00:00:00"}
