{"id":"https://openalex.org/W7139951097","doi":"https://doi.org/10.1016/j.procs.2026.01.069","title":"Reinforcement-Learned Speech Enhancement Models for Real-Time Adaptive Human-Computer Interaction","display_name":"Reinforcement-Learned Speech Enhancement Models for Real-Time Adaptive Human-Computer Interaction","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7139951097","doi":"https://doi.org/10.1016/j.procs.2026.01.069"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2026.01.069","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.069","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2026.01.069","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072998243","display_name":"Bidoor Noori Ishaq","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145266","display_name":"Southern Technical University","ror":"https://ror.org/03sax3264","country_code":"IQ","type":"education","lineage":["https://openalex.org/I4210145266"]}],"countries":["IQ"],"is_corresponding":false,"raw_author_name":"Bidoor Noori Ishaq","raw_affiliation_strings":["Department of Cybersecurity science, Al Kunooze University College of Technical Engineering, Basrah, Iraq"],"affiliations":[{"raw_affiliation_string":"Department of Cybersecurity science, Al Kunooze University College of Technical Engineering, Basrah, Iraq","institution_ids":["https://openalex.org/I4210145266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130225992","display_name":"Naji Mutar Saheb","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145266","display_name":"Southern Technical University","ror":"https://ror.org/03sax3264","country_code":"IQ","type":"education","lineage":["https://openalex.org/I4210145266"]}],"countries":["IQ"],"is_corresponding":false,"raw_author_name":"Naji Mutar Saheb","raw_affiliation_strings":["Department of Cybersecurity science, Al Kunooze University College of Technical Engineering, Basrah, Iraq"],"affiliations":[{"raw_affiliation_string":"Department of Cybersecurity science, Al Kunooze University College of Technical Engineering, Basrah, Iraq","institution_ids":["https://openalex.org/I4210145266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130246876","display_name":"Aay Muwafaq Ismael","orcid":null},"institutions":[{"id":"https://openalex.org/I45998257","display_name":"Sohar University","ror":"https://ror.org/02ftvf862","country_code":"OM","type":"education","lineage":["https://openalex.org/I45998257"]}],"countries":["OM"],"is_corresponding":false,"raw_author_name":"Aay Muwafaq Ismael","raw_affiliation_strings":["College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman"],"affiliations":[{"raw_affiliation_string":"College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman","institution_ids":["https://openalex.org/I45998257"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5130227408","display_name":"Maen Qaddoura","orcid":null},"institutions":[{"id":"https://openalex.org/I45998257","display_name":"Sohar University","ror":"https://ror.org/02ftvf862","country_code":"OM","type":"education","lineage":["https://openalex.org/I45998257"]}],"countries":["OM"],"is_corresponding":true,"raw_author_name":"Maen Qaddoura","raw_affiliation_strings":["College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman"],"affiliations":[{"raw_affiliation_string":"College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman","institution_ids":["https://openalex.org/I45998257"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5130227408"],"corresponding_institution_ids":["https://openalex.org/I45998257"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.94825766,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"275","issue":null,"first_page":"594","last_page":"601"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.6225000023841858,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.6225000023841858,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.12449999898672104,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.04960000142455101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.6980000138282776},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.29179999232292175},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.28119999170303345},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.2768000066280365},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.27300000190734863}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9081000089645386},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.6980000138282776},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5569999814033508},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4269999861717224},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.28119999170303345},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.2768000066280365},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C2986800882","wikidata":"https://www.wikidata.org/wiki/Q7168187","display_name":"Performance enhancement","level":2,"score":0.25769999623298645}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2026.01.069","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.069","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2026.01.069","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.069","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W3111240127","https://openalex.org/W3210350108","https://openalex.org/W4210475104","https://openalex.org/W4285389493","https://openalex.org/W4297904486","https://openalex.org/W4304013688","https://openalex.org/W4321437640","https://openalex.org/W4322731291","https://openalex.org/W4323309956","https://openalex.org/W4362006149","https://openalex.org/W4367055146","https://openalex.org/W4367627627","https://openalex.org/W4380434618","https://openalex.org/W4385067602","https://openalex.org/W4385701164","https://openalex.org/W4385800720","https://openalex.org/W4387587611","https://openalex.org/W4387805930","https://openalex.org/W4388107429","https://openalex.org/W4388679725","https://openalex.org/W4389719868","https://openalex.org/W4390362839","https://openalex.org/W4390506533","https://openalex.org/W4390547023","https://openalex.org/W4391431903","https://openalex.org/W4392854048","https://openalex.org/W4394895982","https://openalex.org/W4395447416","https://openalex.org/W4395675494","https://openalex.org/W4396553703","https://openalex.org/W4396601469","https://openalex.org/W4396680728","https://openalex.org/W4398185455","https://openalex.org/W4398193181","https://openalex.org/W4399457811","https://openalex.org/W4399468713","https://openalex.org/W4400526454","https://openalex.org/W4400733770","https://openalex.org/W4402672259","https://openalex.org/W4402787888","https://openalex.org/W4402877857","https://openalex.org/W4403104615","https://openalex.org/W4403111444","https://openalex.org/W4403938537"],"related_works":[],"abstract_inverted_index":{"Virtual":[0],"assistants,":[1],"teleconferencing,":[2],"and":[3,31,52,87,125,132,139,150],"assistive":[4],"technologies":[5],"utilize":[6],"real-time":[7,126,152],"speech":[8,13,111,153],"augmentation.":[9],"Traditional":[10],"deep":[11,61],"learning-based":[12],"augmentation":[14,154],"methods":[15],"often":[16],"yield":[17],"inferior":[18],"voice":[19,67],"quality":[20,112],"in":[21,70,137,141,143],"real-world":[22],"scenarios":[23],"due":[24],"to":[25,33,35,49,118],"their":[26],"reliance":[27],"on":[28],"static":[29],"parameters":[30],"inability":[32],"adapt":[34],"dynamic":[36],"acoustic":[37],"conditions.":[38],"This":[39],"paper":[40],"recommends":[41],"RL-SEM,":[42],"which":[43],"combines":[44],"RL":[45,56,92],"with":[46],"adaptive":[47,151],"optimization":[48],"improve":[50],"intelligibility":[51],"reduce":[53],"noise.":[54],"An":[55],"agent":[57],"led":[58],"by":[59,135],"a":[60],"neural":[62],"network":[63],"may":[64],"dynamically":[65],"adjust":[66],"enhancement":[68],"settings":[69],"the":[71],"proposed":[72],"framework":[73],"using":[74,99],"contextual":[75],"information.":[76],"The":[77],"Firefly":[78],"Algorithm":[79],"(FA)":[80],"improves":[81,156],"learning":[82],"stability,":[83],"convergence,":[84],"policy":[85],"exploration,":[86],"strong":[88],"adaptation":[89],"while":[90],"optimizing":[91],"hyperparameters.":[93],"A":[94],"reward":[95],"function":[96],"is":[97],"created":[98],"an":[100],"objective":[101,116],"metric,":[102],"such":[103],"as":[104],"signal-to-noise":[105],"ratio":[106],"(SNR),":[107],"perceptual":[108],"evaluation":[109],"of":[110,145],"(PESQ),":[113],"or":[114],"short-time":[115],"intelligibility,":[117],"generate":[119],"realistic":[120],"speech.":[121],"In":[122],"stationary,":[123],"non-stationary,":[124],"noisy":[127],"situations,":[128],"RL-SEM":[129],"outperforms":[130],"DNN":[131],"spectral":[133],"subtraction":[134],"22%":[136],"PESQ":[138],"16%":[140],"STOI":[142],"terms":[144],"latency.":[146],"Finally,":[147],"RL-SEM\u2019s":[148],"flexible":[149],"architecture":[155],"next-gen":[157],"HCI":[158],"applications.":[159]},"counts_by_year":[],"updated_date":"2026-03-22T06:25:25.174409","created_date":"2026-03-21T00:00:00"}
