{"id":"https://openalex.org/W4312414357","doi":"https://doi.org/10.1109/access.2022.3228744","title":"A Compact CNN-Based Speech Enhancement With Adaptive Filter Design Using Gabor Function and Region-Aware Convolution","display_name":"A Compact CNN-Based Speech Enhancement With Adaptive Filter Design Using Gabor Function and Region-Aware Convolution","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4312414357","doi":"https://doi.org/10.1109/access.2022.3228744"},"language":"en","primary_location":{"id":"doi:10.1109/access.2022.3228744","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3228744","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09982431.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09982431.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053977633","display_name":"Salinna Abdullah","orcid":"https://orcid.org/0000-0003-0092-3190"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Salinna Abdullah","raw_affiliation_strings":["Department of Electronic and Electrical Engineering, University College London (UCL), London, U.K","Department of Electronic and Electrical Engineering, University College London (UCL), Torrington Place, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Electrical Engineering, University College London (UCL), London, U.K","institution_ids":["https://openalex.org/I45129253"]},{"raw_affiliation_string":"Department of Electronic and Electrical Engineering, University College London (UCL), Torrington Place, London, UK","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107978005","display_name":"Majid Zamani","orcid":"https://orcid.org/0000-0002-8986-757X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Majid Zamani","raw_affiliation_strings":["Department of Electronic and Electrical Engineering, University College London (UCL), London, U.K","Department of Electronic and Electrical Engineering, University College London (UCL), Torrington Place, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Electrical Engineering, University College London (UCL), London, U.K","institution_ids":["https://openalex.org/I45129253"]},{"raw_affiliation_string":"Department of Electronic and Electrical Engineering, University College London (UCL), Torrington Place, London, UK","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012493816","display_name":"Andreas Demosthenous","orcid":"https://orcid.org/0000-0003-0623-963X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andreas Demosthenous","raw_affiliation_strings":["Department of Electronic and Electrical Engineering, University College London (UCL), London, U.K","Department of Electronic and Electrical Engineering, University College London (UCL), Torrington Place, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Electrical Engineering, University College London (UCL), London, U.K","institution_ids":["https://openalex.org/I45129253"]},{"raw_affiliation_string":"Department of Electronic and Electrical Engineering, University College London (UCL), Torrington Place, London, UK","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5053977633"],"corresponding_institution_ids":["https://openalex.org/I45129253"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.4469,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.60131755,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"10","issue":null,"first_page":"130657","last_page":"130671"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.7550712823867798},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7254011631011963},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5716953873634338},{"id":"https://openalex.org/keywords/gabor-filter","display_name":"Gabor filter","score":0.5297858715057373},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5153024196624756},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.47355949878692627},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44695600867271423},{"id":"https://openalex.org/keywords/circular-convolution","display_name":"Circular convolution","score":0.4413212239742279},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4300917088985443},{"id":"https://openalex.org/keywords/adaptive-filter","display_name":"Adaptive filter","score":0.4252588152885437},{"id":"https://openalex.org/keywords/overlap\u2013add-method","display_name":"Overlap\u2013add method","score":0.4151996374130249},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.36931729316711426},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33167022466659546},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.26479536294937134},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.19400906562805176},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.185970276594162},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.17569437623023987},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.12687379121780396},{"id":"https://openalex.org/keywords/fourier-analysis","display_name":"Fourier analysis","score":0.06724336743354797}],"concepts":[{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.7550712823867798},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7254011631011963},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5716953873634338},{"id":"https://openalex.org/C2779883129","wikidata":"https://www.wikidata.org/wiki/Q2447890","display_name":"Gabor filter","level":3,"score":0.5297858715057373},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5153024196624756},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.47355949878692627},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44695600867271423},{"id":"https://openalex.org/C194980680","wikidata":"https://www.wikidata.org/wiki/Q245450","display_name":"Circular convolution","level":5,"score":0.4413212239742279},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4300917088985443},{"id":"https://openalex.org/C102248274","wikidata":"https://www.wikidata.org/wiki/Q168388","display_name":"Adaptive filter","level":2,"score":0.4252588152885437},{"id":"https://openalex.org/C181002996","wikidata":"https://www.wikidata.org/wiki/Q1611641","display_name":"Overlap\u2013add method","level":5,"score":0.4151996374130249},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36931729316711426},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33167022466659546},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26479536294937134},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.19400906562805176},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.185970276594162},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.17569437623023987},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.12687379121780396},{"id":"https://openalex.org/C203024314","wikidata":"https://www.wikidata.org/wiki/Q1365258","display_name":"Fourier analysis","level":3,"score":0.06724336743354797},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C76563020","wikidata":"https://www.wikidata.org/wiki/Q4817582","display_name":"Fractional Fourier transform","level":4,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/access.2022.3228744","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3228744","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09982431.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:eprints.soton.ac.uk:489270","is_oa":true,"landing_page_url":"http://doi.org/10.1109/ACCESS.2022.3228744>).","pdf_url":"https://eprints.soton.ac.uk/489270/1/A_Compact_CNN-Based_Speech_Enhancement_With_Adaptive_Filter_Design_Using_Gabor_Function_and_Region-Aware_Convolution.pdf","source":{"id":"https://openalex.org/S4306401019","display_name":"ePrints Soton (University of Southampton)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I43439940","host_organization_name":"University of Southampton","host_organization_lineage":["https://openalex.org/I43439940"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"},{"id":"pmh:oai:doaj.org/article:f896bb4897bb46d68283e3eb5b9ec604","is_oa":true,"landing_page_url":"https://doaj.org/article/f896bb4897bb46d68283e3eb5b9ec604","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 10, Pp 130657-130671 (2022)","raw_type":"article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10162098","is_oa":false,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10162098/","pdf_url":null,"source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"   IEEE Access , 10    pp. 130657-130671.   (2022)      ","raw_type":"Article"}],"best_oa_location":{"id":"doi:10.1109/access.2022.3228744","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3228744","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09982431.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.6100000143051147,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G192619431","display_name":null,"funder_award_id":"EP/R512400/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312414357.pdf","grobid_xml":"https://content.openalex.org/works/W4312414357.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W44815768","https://openalex.org/W1552314771","https://openalex.org/W1635512741","https://openalex.org/W1782480827","https://openalex.org/W1974387177","https://openalex.org/W2030937226","https://openalex.org/W2042407743","https://openalex.org/W2044893557","https://openalex.org/W2054139811","https://openalex.org/W2102372511","https://openalex.org/W2102898380","https://openalex.org/W2114174754","https://openalex.org/W2141411743","https://openalex.org/W2141998673","https://openalex.org/W2165630397","https://openalex.org/W2194775991","https://openalex.org/W2516342150","https://openalex.org/W2889717020","https://openalex.org/W2936689732","https://openalex.org/W2937484199","https://openalex.org/W2943554574","https://openalex.org/W2950448225","https://openalex.org/W2963103134","https://openalex.org/W2978822655","https://openalex.org/W2981609494","https://openalex.org/W3015278429","https://openalex.org/W3090641261","https://openalex.org/W3095737053","https://openalex.org/W3112103486","https://openalex.org/W3127931870","https://openalex.org/W3134695619","https://openalex.org/W3147539069","https://openalex.org/W3186033197","https://openalex.org/W3210597831","https://openalex.org/W4206734304","https://openalex.org/W4223440121","https://openalex.org/W6637373629","https://openalex.org/W6723181079"],"related_works":["https://openalex.org/W3106959200","https://openalex.org/W2133280289","https://openalex.org/W2267589039","https://openalex.org/W2382152453","https://openalex.org/W1796097737","https://openalex.org/W2126886659","https://openalex.org/W2385700956","https://openalex.org/W2368932764","https://openalex.org/W2361284596","https://openalex.org/W2544310281"],"abstract_inverted_index":{"Speech":[0],"enhancement":[1],"(SE)":[2],"is":[3],"used":[4],"in":[5,24,203,214],"many":[6],"applications,":[7],"such":[8],"as":[9,87],"hearing":[10],"devices,":[11],"to":[12,68,140,145,234],"improve":[13],"speech":[14,106,222,236],"intelligibility":[15,217],"and":[16,55,125,159,198,212,225,244],"quality.":[17],"Convolutional":[18],"neural":[19],"network-based":[20],"(CNN-based)":[21],"SE":[22,36,43,175,181,187,193,201],"algorithms":[23,177],"literature":[25],"often":[26],"employ":[27],"generic":[28,183],"convolutional":[29,66,84],"filters":[30,67,102],"that":[31],"are":[32,129],"not":[33],"optimized":[34],"for":[35,73,94],"applications.":[37],"This":[38],"paper":[39],"presents":[40],"a":[41,179,185,191,199],"CNN-based":[42,174,180,186,192,200],"algorithm":[44,60],"with":[45,150,195,206,238],"an":[46,207],"adaptive":[47,96],"filter":[48],"design":[49],"(named":[50],"\u2018CNN-AFD\u2019)":[51],"using":[52],"Gabor":[53,63],"function":[54],"region-aware":[56,98,189],"convolution.":[57],"The":[58,77,100,168],"proposed":[59,169],"incorporates":[61],"fixed":[62],"functions":[64],"into":[65],"model":[69,162],"human":[70],"auditory":[71],"processing":[72,202],"improved":[74],"denoising":[75],"performance.":[76],"feature":[78],"maps":[79],"obtained":[80],"from":[81,105],"the":[82,115,121,135,204],"Gabor-incorporated":[83],"layers":[85],"serve":[86],"learnable":[88],"guided":[89],"masks":[90],"(tuned":[91],"at":[92,241],"backpropagation)":[93],"generating":[95],"custom":[97,101],"filters.":[99],"extract":[103],"features":[104],"regions":[107],"(i.e.,":[108,178],"\u2018region-aware\u2019)":[109],"while":[110],"maintaining":[111],"translation-invariance.":[112],"To":[113],"reduce":[114],"high":[116,151],"cost":[117],"of":[118,120,148,153,209,221],"inference":[119],"CNN,":[122],"skip":[123,132,157],"convolution":[124,133,158],"activation":[126],"analysis-wise":[127],"pruning":[128],"explored.":[130],"Employing":[131],"allowed":[134],"training":[136],"time":[137],"per":[138],"epoch":[139],"be":[141],"reduced":[142],"by":[143,164],"close":[144],"40%.":[146],"Pruning":[147],"neurons":[149],"numbers":[152],"zero":[154],"activations":[155],"complements":[156],"significantly":[160],"reduces":[161],"parameters":[163],"more":[165],"than":[166],"30%.":[167],"CNN-AFD":[170],"outperformed":[171],"all":[172],"four":[173],"baseline":[176],"employing":[182],"filters,":[184],"without":[188],"convolution,":[190],"trained":[194],"complex":[196],"spectrograms":[197],"time-domain)":[205],"average":[208],"0.95,":[210],"1.82":[211],"0.82":[213],"short-time":[215],"objective":[216],"(STOI),":[218],"perceptual":[219],"evaluation":[220],"quality":[223],"(PESQ)":[224],"logarithmic":[226],"spectral":[227],"distance":[228],"(LSD)":[229],"scores,":[230],"respectively,":[231],"when":[232],"tasked":[233],"denoise":[235],"contaminated":[237],"NOISEX-92":[239],"noises":[240],"-5,":[242],"0":[243],"5":[245],"dB":[246],"signal-to-noise":[247],"ratios":[248],"(SNRs).":[249]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
