{"id":"https://openalex.org/W4387785490","doi":"https://doi.org/10.1109/ispa58351.2023.10278916","title":"Optimizing Computational Complexity: Real-Time Speech Enhancement Using an Efficient Convolutional Recurrent Dense Neural Network","display_name":"Optimizing Computational Complexity: Real-Time Speech Enhancement Using an Efficient Convolutional Recurrent Dense Neural Network","publication_year":2023,"publication_date":"2023-09-18","ids":{"openalex":"https://openalex.org/W4387785490","doi":"https://doi.org/10.1109/ispa58351.2023.10278916"},"language":"en","primary_location":{"id":"doi:10.1109/ispa58351.2023.10278916","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ispa58351.2023.10278916","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 International Symposium on Image and Signal Processing and Analysis (ISPA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113027501","display_name":"Amir Rajabi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158205","display_name":"Aschaffenburg University of Applied Sciences","ror":"https://ror.org/04sms9203","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210158205"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Amir Rajabi","raw_affiliation_strings":["Aschaffenburg University of Applied Sciences,Signal Processing Laboratory,Aschaffenburg,Germany","Signal Processing Laboratory, Aschaffenburg University of Applied Sciences, Aschaffenburg, Germany"],"affiliations":[{"raw_affiliation_string":"Aschaffenburg University of Applied Sciences,Signal Processing Laboratory,Aschaffenburg,Germany","institution_ids":["https://openalex.org/I4210158205"]},{"raw_affiliation_string":"Signal Processing Laboratory, Aschaffenburg University of Applied Sciences, Aschaffenburg, Germany","institution_ids":["https://openalex.org/I4210158205"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043401097","display_name":"Mohammed Krini","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158205","display_name":"Aschaffenburg University of Applied Sciences","ror":"https://ror.org/04sms9203","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210158205"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Mohammed Krini","raw_affiliation_strings":["Aschaffenburg University of Applied Sciences,Signal Processing Laboratory,Aschaffenburg,Germany","Signal Processing Laboratory, Aschaffenburg University of Applied Sciences, Aschaffenburg, Germany"],"affiliations":[{"raw_affiliation_string":"Aschaffenburg University of Applied Sciences,Signal Processing Laboratory,Aschaffenburg,Germany","institution_ids":["https://openalex.org/I4210158205"]},{"raw_affiliation_string":"Signal Processing Laboratory, Aschaffenburg University of Applied Sciences, Aschaffenburg, Germany","institution_ids":["https://openalex.org/I4210158205"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5113027501"],"corresponding_institution_ids":["https://openalex.org/I4210158205"],"apc_list":null,"apc_paid":null,"fwci":0.2033,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.4594104,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.820737361907959},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.7206778526306152},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.6731839179992676},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5812406539916992},{"id":"https://openalex.org/keywords/intelligibility","display_name":"Intelligibility (philosophy)","score":0.5766991376876831},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5764581561088562},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5738479495048523},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5078175663948059},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39067378640174866},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2167181670665741},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.1620330810546875},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.09058544039726257}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.820737361907959},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.7206778526306152},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.6731839179992676},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5812406539916992},{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.5766991376876831},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5764581561088562},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5738479495048523},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5078175663948059},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39067378640174866},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2167181670665741},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.1620330810546875},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.09058544039726257},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ispa58351.2023.10278916","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ispa58351.2023.10278916","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 International Symposium on Image and Signal Processing and Analysis (ISPA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W891534129","https://openalex.org/W1893870629","https://openalex.org/W2067295501","https://openalex.org/W2144404214","https://openalex.org/W2773624778","https://openalex.org/W2889442120","https://openalex.org/W2889597349","https://openalex.org/W2913481574","https://openalex.org/W2921661700","https://openalex.org/W2944985332","https://openalex.org/W2949756029","https://openalex.org/W2962866211","https://openalex.org/W2963285578","https://openalex.org/W2963446712","https://openalex.org/W2963902628","https://openalex.org/W2964058413","https://openalex.org/W2964171275","https://openalex.org/W3013382035","https://openalex.org/W3015844538","https://openalex.org/W3097627357","https://openalex.org/W3097945073","https://openalex.org/W3160129476","https://openalex.org/W3161528727","https://openalex.org/W3168779539","https://openalex.org/W3198162371","https://openalex.org/W4289242435","https://openalex.org/W4291238569","https://openalex.org/W6639428356","https://openalex.org/W6785764544"],"related_works":["https://openalex.org/W4293226380","https://openalex.org/W4321487865","https://openalex.org/W4313906399","https://openalex.org/W1630865680","https://openalex.org/W1986772939","https://openalex.org/W2037635165","https://openalex.org/W2738829087","https://openalex.org/W2542062716","https://openalex.org/W1505346162","https://openalex.org/W4200562864"],"abstract_inverted_index":{"Real-time":[0],"communication":[1],"through":[2],"cell":[3],"phones":[4],"and":[5,57,172],"telephones":[6],"often":[7],"involves":[8],"challenging":[9],"acoustic":[10],"environments":[11],"where":[12],"the":[13,24,38,77,134,170,175,184],"original":[14],"speech":[15,50,55,69,125],"signal":[16],"is":[17,105,127],"contaminated":[18],"by":[19,44],"environmental":[20],"noise,":[21],"known":[22],"as":[23],"cocktail":[25],"party":[26],"problem.":[27,91],"Audio":[28],"source":[29],"separation":[30],"can":[31,53,99],"be":[32],"an":[33],"effective":[34],"solution":[35],"for":[36,87,107,124],"isolating":[37],"voice":[39],"in":[40,68,117],"a":[41,72,120,141],"noisy":[42],"environment,":[43],"suppressing":[45],"undesired":[46],"noise":[47],"without":[48],"distorting":[49],"components,":[51],"which":[52,104,129,147],"improve":[54],"quality":[56],"intelligibility.":[58],"Deep":[59],"Neural":[60],"Network":[61],"(DNN)":[62],"models,":[63],"despite":[64],"their":[65],"excellent":[66],"performance":[67,158],"enhancement,":[70],"require":[71,111],"substantial":[73],"computational":[74,94,152],"effort":[75],"during":[76],"inference":[78],"process.":[79],"This":[80],"characteristic":[81],"makes":[82],"them":[83],"less":[84],"than":[85],"ideal":[86],"addressing":[88],"this":[89,118],"specific":[90],"The":[92,137],"high":[93],"complexity":[95],"of":[96,174,183],"deep":[97],"models":[98],"further":[100],"impede":[101],"regression":[102],"latency,":[103],"crucial":[106],"real-time":[108],"applications":[109],"that":[110],"minimized":[112],"complexity.":[113],"Considering":[114],"these":[115],"assumptions":[116],"paper,":[119],"novel":[121],"neural":[122],"network":[123,177],"enhancement":[126],"presented,":[128],"incorporates":[130],"phase":[131],"information":[132],"into":[133],"loss":[135],"function.":[136],"proposed":[138],"method":[139],"utilizes":[140],"convolutional":[142],"Recurrent":[143],"Dense":[144],"(CRD)":[145],"network,":[146],"not":[148],"only":[149],"achieves":[150],"notable":[151],"efficiency":[153],"but":[154],"also":[155],"demonstrates":[156],"superior":[157],"compared":[159,179],"to":[160,168],"other":[161],"existing":[162],"networks.":[163],"Experimental":[164],"results":[165],"are":[166],"provided":[167],"highlight":[169],"advantages":[171],"distinctions":[173],"CRD":[176],"when":[178],"with":[180],"alternative":[181],"state":[182],"art":[185],"approaches.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
