{"id":"https://openalex.org/W4388430756","doi":"https://doi.org/10.1109/lsp.2023.3330124","title":"Lite-RTSE: Exploring a Cost-Effective Lite DNN Model for Real-Time Speech Enhancement in RTC Scenarios","display_name":"Lite-RTSE: Exploring a Cost-Effective Lite DNN Model for Real-Time Speech Enhancement in RTC Scenarios","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4388430756","doi":"https://doi.org/10.1109/lsp.2023.3330124"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2023.3330124","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/lsp.2023.3330124","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008366157","display_name":"Xingwei Liang","orcid":"https://orcid.org/0000-0002-5940-3440"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I4210093050","display_name":"Konka (China)","ror":"https://ror.org/00qa3c235","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210093050"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xingwei Liang","raw_affiliation_strings":["Harbin Institute of Technology and Konka Group Company, Ltd., Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology and Konka Group Company, Ltd., Shenzhen, China","institution_ids":["https://openalex.org/I4210093050","https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100388629","display_name":"Lu Zhang","orcid":"https://orcid.org/0000-0002-3469-2899"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Zhang","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102869280","display_name":"Zhiyong Wu","orcid":"https://orcid.org/0000-0001-8533-0524"},"institutions":[{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Wu","raw_affiliation_strings":["Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026719663","display_name":"Ruifeng Xu","orcid":"https://orcid.org/0000-0002-4009-5679"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruifeng Xu","raw_affiliation_strings":["Harbin Institute of Technology, Peng Cheng Laboratory, and Guangdong Provincial Key Laboratory of Novel Security Intelligence Technologies, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Peng Cheng Laboratory, and Guangdong Provincial Key Laboratory of Novel Security Intelligence Technologies, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793","https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5008366157"],"corresponding_institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4210093050"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.15455399,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":null,"first_page":"1697","last_page":"1701"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.9726999998092651,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.8329044580459595},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7082734704017639},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5748577117919922},{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.5033039450645447},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.4927869141101837},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.474984347820282},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3007674217224121},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2742993235588074}],"concepts":[{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.8329044580459595},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7082734704017639},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5748577117919922},{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.5033039450645447},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.4927869141101837},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.474984347820282},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3007674217224121},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2742993235588074}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2023.3330124","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/lsp.2023.3330124","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.5600000023841858,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G6312846351","display_name":null,"funder_award_id":"62176076","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8139119493","display_name":null,"funder_award_id":"2023A1515012922","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1482149378","https://openalex.org/W1552314771","https://openalex.org/W1924770834","https://openalex.org/W1993195403","https://openalex.org/W2051428568","https://openalex.org/W2097117768","https://openalex.org/W2127851351","https://openalex.org/W2133564696","https://openalex.org/W2141411743","https://openalex.org/W2141998673","https://openalex.org/W2219249508","https://openalex.org/W2603567530","https://openalex.org/W2678916739","https://openalex.org/W2889048668","https://openalex.org/W2889442120","https://openalex.org/W2914067823","https://openalex.org/W2948116732","https://openalex.org/W2952979007","https://openalex.org/W2962793908","https://openalex.org/W2963103134","https://openalex.org/W2963868408","https://openalex.org/W2972404066","https://openalex.org/W2991361823","https://openalex.org/W2998445964","https://openalex.org/W3027637851","https://openalex.org/W3031505850","https://openalex.org/W3095248373","https://openalex.org/W3096408984","https://openalex.org/W3097817799","https://openalex.org/W3103034221","https://openalex.org/W3119316801","https://openalex.org/W3161140524","https://openalex.org/W3164605550","https://openalex.org/W3174609245","https://openalex.org/W3197042120","https://openalex.org/W3198680319","https://openalex.org/W3213188934","https://openalex.org/W4221149546","https://openalex.org/W4225323964","https://openalex.org/W4226185896","https://openalex.org/W4232282348","https://openalex.org/W4297841575","https://openalex.org/W6640212811","https://openalex.org/W6679434410","https://openalex.org/W6688816777","https://openalex.org/W6754473786","https://openalex.org/W6777701575"],"related_works":["https://openalex.org/W2036157531","https://openalex.org/W2401567014","https://openalex.org/W2889698889","https://openalex.org/W2538939196","https://openalex.org/W3045520545","https://openalex.org/W2770665941","https://openalex.org/W3096184950","https://openalex.org/W4231424160","https://openalex.org/W2275432853","https://openalex.org/W197907117"],"abstract_inverted_index":{"The":[0],"noise":[1],"reduction":[2],"performance":[3,122],"of":[4,21,46,96,106],"DNN-based":[5],"monaural":[6],"speech":[7,39,63,73,120],"enhancement":[8,40,64,74],"(SE)":[9],"methods":[10,41],"has":[11,24],"been":[12,26],"significantly":[13],"improved":[14],"in":[15],"recent":[16],"years,":[17],"while":[18,128],"the":[19,22,77],"complexity":[20],"model":[23,55,70,114],"also":[25],"increased":[27],"several":[28],"times.":[29],"Therefore,":[30],"it":[31],"is":[32,115],"highly":[33],"desirable":[34],"to":[35,101,117],"explore":[36],"more":[37],"\u2018cost-effective\u2019":[38],"for":[42],"a":[43,60,85],"wider":[44],"range":[45],"hardware":[47],"platforms.":[48],"In":[49],"this":[50],"letter,":[51],"we":[52],"investigate":[53],"low-cost":[54],"design":[56],"strategies":[57],"and":[58,84,104],"propose":[59],"lite":[61],"real-time":[62,68],"(Lite-RTSE)":[65],"model.":[66],"This":[67],"SE":[69,126],"achieves":[71],"efficient":[72],"by":[75],"leveraging":[76],"low-dimensional":[78],"long":[79],"short-term":[80],"memory":[81],"(LSTM)":[82],"units":[83],"novel":[86],"multi-order":[87],"convolution":[88],"block.":[89],"A":[90],"two-stage":[91],"complex":[92],"spectrum":[93],"reconstruction":[94],"scheme":[95],"\u2018masking":[97],"+":[98],"residual\u2019":[99],"contributes":[100],"better":[102],"quality":[103],"intelligibility":[105],"enhanced":[107],"speech.":[108],"Experimental":[109],"results":[110],"show":[111],"that":[112],"Lite-RTSE":[113],"able":[116],"achieve":[118],"competitive":[119],"denoising":[121],"compared":[123],"with":[124],"state-of-the-art":[125],"models,":[127],"only":[129],"containing":[130],"1.56":[131],"M":[132],"parameters":[133],"at":[134],"0.55":[135],"G":[136],"multiply-accumulate":[137],"operations":[138],"per":[139],"second":[140],"(MAC/S).":[141]},"counts_by_year":[],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
