{"id":"https://openalex.org/W2647772669","doi":"https://doi.org/10.1109/icassp.2017.7953235","title":"Dereverberation based on bin-wise temporal variations of complex spectrogram","display_name":"Dereverberation based on bin-wise temporal variations of complex spectrogram","publication_year":2017,"publication_date":"2017-03-01","ids":{"openalex":"https://openalex.org/W2647772669","doi":"https://doi.org/10.1109/icassp.2017.7953235","mag":"2647772669"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2017.7953235","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2017.7953235","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053774403","display_name":"Tzu-Hao Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Tzu-Hao Chen","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu 300, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu 300, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109366871","display_name":"Chun Jung Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chun Huang","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu 300, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu 300, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088864528","display_name":"Tai-Shih Chi","orcid":"https://orcid.org/0000-0002-0584-8399"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tai-Shih Chi","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu 300, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu 300, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5053774403"],"corresponding_institution_ids":["https://openalex.org/I148366613"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06547989,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"2","issue":null,"first_page":"5635","last_page":"5639"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.8266183137893677},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7395513653755188},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.639527440071106},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.6139531135559082},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.5681523680686951},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.558458685874939},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5152075886726379},{"id":"https://openalex.org/keywords/bin","display_name":"Bin","score":0.5052962899208069},{"id":"https://openalex.org/keywords/multiplicative-function","display_name":"Multiplicative function","score":0.46310847997665405},{"id":"https://openalex.org/keywords/time-domain","display_name":"Time domain","score":0.4390407204627991},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4243469834327698},{"id":"https://openalex.org/keywords/noise-measurement","display_name":"Noise measurement","score":0.4108179211616516},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33934149146080017},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.18112823367118835},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15806668996810913},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.062202632427215576}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.8266183137893677},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7395513653755188},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.639527440071106},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.6139531135559082},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.5681523680686951},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.558458685874939},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5152075886726379},{"id":"https://openalex.org/C156273044","wikidata":"https://www.wikidata.org/wiki/Q4913766","display_name":"Bin","level":2,"score":0.5052962899208069},{"id":"https://openalex.org/C42747912","wikidata":"https://www.wikidata.org/wiki/Q1048447","display_name":"Multiplicative function","level":2,"score":0.46310847997665405},{"id":"https://openalex.org/C103824480","wikidata":"https://www.wikidata.org/wiki/Q185889","display_name":"Time domain","level":2,"score":0.4390407204627991},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4243469834327698},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.4108179211616516},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33934149146080017},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.18112823367118835},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15806668996810913},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.062202632427215576},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2017.7953235","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2017.7953235","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.6399999856948853}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W1998648683","https://openalex.org/W2006129368","https://openalex.org/W2054139811","https://openalex.org/W2054480978","https://openalex.org/W2132214945","https://openalex.org/W2141998673","https://openalex.org/W2144433020","https://openalex.org/W2150057756","https://openalex.org/W2153894152","https://openalex.org/W2156676906","https://openalex.org/W2168610508","https://openalex.org/W2188162373","https://openalex.org/W2291877678","https://openalex.org/W3127686677","https://openalex.org/W6681573292","https://openalex.org/W6686978693","https://openalex.org/W6789826613"],"related_works":["https://openalex.org/W2530685530","https://openalex.org/W2107701374","https://openalex.org/W4375868962","https://openalex.org/W2011227383","https://openalex.org/W2088854863","https://openalex.org/W4402568167","https://openalex.org/W3179495260","https://openalex.org/W1976719989","https://openalex.org/W3127543252","https://openalex.org/W2065606036"],"abstract_inverted_index":{"Humans":[0],"analyze":[1],"sounds":[2],"not":[3],"only":[4],"based":[5,31],"on":[6,12],"their":[7],"frequency":[8,18,44],"contents,":[9,45],"but":[10],"also":[11],"the":[13,17,35,40,54,64,69,74,82,86,92,110],"temporal":[14,41],"variations":[15,42],"of":[16,43,85,100],"contents.":[19],"Inspired":[20],"by":[21],"auditory":[22],"perception,":[23],"we":[24,72],"propose":[25],"a":[26],"deep":[27],"neural":[28],"network":[29],"(DNN)":[30],"dereverberation":[32,113],"algorithm":[33,96],"in":[34,46,53,63],"rate":[36,65],"domain,":[37],"which":[38],"presents":[39],"this":[47],"paper.":[48],"We":[49],"show":[50,90],"convolutional":[51],"noise":[52,62],"time":[55],"domain":[56],"can":[57],"be":[58],"approximated":[59],"to":[60],"multiplicative":[61,70],"domain.":[66],"To":[67],"remove":[68],"noise,":[71],"adopt":[73],"rate-domain":[75,94],"complex-valued":[76],"ideal":[77],"ratio":[78],"mask":[79],"(RDcIRM)":[80],"as":[81],"training":[83],"target":[84],"DNN.":[87],"Simulation":[88],"results":[89],"that":[91],"proposed":[93],"DNN":[95],"is":[97,117],"more":[98],"capable":[99],"recovering":[101],"high-intelligible":[102],"and":[103],"high-quality":[104],"speech":[105,108,121],"from":[106],"reverberant":[107],"than":[109],"compared":[111],"state-of-the-art":[112],"algorithm.":[114],"Hence,":[115],"it":[116],"highly":[118],"suitable":[119],"for":[120],"applications":[122],"involving":[123],"human":[124],"listeners.":[125]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
