{"id":"https://openalex.org/W4387870105","doi":"https://doi.org/10.1109/mlsp55844.2023.10285887","title":"Predicting Room Impulse Responses Through Encoder-Decoder Convolutional Neural Networks","display_name":"Predicting Room Impulse Responses Through Encoder-Decoder Convolutional Neural Networks","publication_year":2023,"publication_date":"2023-09-17","ids":{"openalex":"https://openalex.org/W4387870105","doi":"https://doi.org/10.1109/mlsp55844.2023.10285887"},"language":"en","primary_location":{"id":"doi:10.1109/mlsp55844.2023.10285887","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp55844.2023.10285887","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 33rd International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101613019","display_name":"Ignacio Mart\u00edn","orcid":"https://orcid.org/0000-0002-1217-7546"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"I. Martin","raw_affiliation_strings":["Universidad Carlos III de Madrid,Dep. Tecnolog&#x00ED;a Electr&#x00F3;nica,Spain"],"affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid,Dep. Tecnolog&#x00ED;a Electr&#x00F3;nica,Spain","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036496473","display_name":"Francisco Pastor","orcid":"https://orcid.org/0000-0003-0006-6811"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"F. Pastor","raw_affiliation_strings":["I3B, Universitat Polit&#x00E8;cnica de Val&#x00E8;ncia,Spain"],"affiliations":[{"raw_affiliation_string":"I3B, Universitat Polit&#x00E8;cnica de Val&#x00E8;ncia,Spain","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084588676","display_name":"F\u00e9lix Fuentes-Hurtado","orcid":"https://orcid.org/0000-0002-4320-245X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"F. Fuentes-Hurtado","raw_affiliation_strings":["Universidad Polit&#x00E9;cnica de Madrid,Dep. Sistemas Inform&#x00E1;ticos,Spain"],"affiliations":[{"raw_affiliation_string":"Universidad Polit&#x00E9;cnica de Madrid,Dep. Sistemas Inform&#x00E1;ticos,Spain","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056031998","display_name":"Jose A. Belloch","orcid":"https://orcid.org/0000-0002-2595-1828"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"J.A. Belloch","raw_affiliation_strings":["Universidad Carlos III de Madrid,Dep. Tecnolog&#x00ED;a Electr&#x00F3;nica,Spain"],"affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid,Dep. Tecnolog&#x00ED;a Electr&#x00F3;nica,Spain","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000598119","display_name":"Luis A. Azpicueta-Ruiz","orcid":"https://orcid.org/0000-0002-2458-0914"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"L. Azpicueta-Ruiz","raw_affiliation_strings":["Universidad Carlos III de Madrid,Dep. Teor&#x00ED;a de la Se&#x00F1;al y Comunicaciones,Spain"],"affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid,Dep. Teor&#x00ED;a de la Se&#x00F1;al y Comunicaciones,Spain","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043316752","display_name":"Valery Naranjo","orcid":"https://orcid.org/0000-0002-0181-3412"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"V. Naranjo","raw_affiliation_strings":["ITEAM, Universitat Polit&#x00E9;cnica de Val&#x00E8;ncia,Spain"],"affiliations":[{"raw_affiliation_string":"ITEAM, Universitat Polit&#x00E9;cnica de Val&#x00E8;ncia,Spain","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083332233","display_name":"Gema Pi\u00f1ero","orcid":"https://orcid.org/0000-0002-8719-8106"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"G. Pi\u00f1ero","raw_affiliation_strings":["ITEAM, Universitat Polit&#x00E9;cnica de Val&#x00E8;ncia,Spain"],"affiliations":[{"raw_affiliation_string":"ITEAM, Universitat Polit&#x00E9;cnica de Val&#x00E8;ncia,Spain","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101613019"],"corresponding_institution_ids":["https://openalex.org/I50357001"],"apc_list":null,"apc_paid":null,"fwci":0.6149,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.70131092,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/short-time-fourier-transform","display_name":"Short-time Fourier transform","score":0.789789080619812},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7346838712692261},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7131825685501099},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5282406210899353},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.5166945457458496},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5116593837738037},{"id":"https://openalex.org/keywords/impulse","display_name":"Impulse (physics)","score":0.5107936859130859},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.49921131134033203},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48089170455932617},{"id":"https://openalex.org/keywords/impulse-response","display_name":"Impulse response","score":0.4614397883415222},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.4518851041793823},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.44636979699134827},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3966256082057953},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2433975338935852},{"id":"https://openalex.org/keywords/fourier-analysis","display_name":"Fourier analysis","score":0.16271913051605225},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09103304147720337}],"concepts":[{"id":"https://openalex.org/C166386157","wikidata":"https://www.wikidata.org/wiki/Q1477735","display_name":"Short-time Fourier transform","level":4,"score":0.789789080619812},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7346838712692261},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7131825685501099},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5282406210899353},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.5166945457458496},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5116593837738037},{"id":"https://openalex.org/C70836080","wikidata":"https://www.wikidata.org/wiki/Q837940","display_name":"Impulse (physics)","level":2,"score":0.5107936859130859},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.49921131134033203},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48089170455932617},{"id":"https://openalex.org/C72279823","wikidata":"https://www.wikidata.org/wiki/Q1139726","display_name":"Impulse response","level":2,"score":0.4614397883415222},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.4518851041793823},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.44636979699134827},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3966256082057953},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2433975338935852},{"id":"https://openalex.org/C203024314","wikidata":"https://www.wikidata.org/wiki/Q1365258","display_name":"Fourier analysis","level":3,"score":0.16271913051605225},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09103304147720337},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mlsp55844.2023.10285887","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp55844.2023.10285887","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 33rd International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320307785","display_name":"3M","ror":"https://ror.org/00mgss748"},{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W3189630","https://openalex.org/W1959608418","https://openalex.org/W2066853009","https://openalex.org/W2410879554","https://openalex.org/W2611901479","https://openalex.org/W2738467312","https://openalex.org/W2964041258","https://openalex.org/W2968047375","https://openalex.org/W2997574889","https://openalex.org/W3047687894","https://openalex.org/W3103001801","https://openalex.org/W3178031393","https://openalex.org/W3206257526","https://openalex.org/W4200470910","https://openalex.org/W4213021155","https://openalex.org/W4223461111","https://openalex.org/W4229050860","https://openalex.org/W4231225162","https://openalex.org/W4292969959","https://openalex.org/W4307687796","https://openalex.org/W4320015822","https://openalex.org/W4320015869","https://openalex.org/W4372341113","https://openalex.org/W6640963894","https://openalex.org/W6681096077","https://openalex.org/W6849761261"],"related_works":["https://openalex.org/W3013693939","https://openalex.org/W2159052453","https://openalex.org/W2566616303","https://openalex.org/W3131327266","https://openalex.org/W2734887215","https://openalex.org/W4297051394","https://openalex.org/W2752972570","https://openalex.org/W2145836866","https://openalex.org/W2272518678","https://openalex.org/W2140267235"],"abstract_inverted_index":{"This":[0],"paper":[1],"investigates":[2],"the":[3,33,55,65,69,73,84,87,92,99,103,106,110,121,149,158,161,167,171,174,180,183,193,200,203,220,223],"ability":[4,181,215],"of":[5,60,72,91,136,160,166,173,182,202],"deep":[6,27],"neural":[7],"networks":[8],"(DNNs)":[9],"to":[10,48,98,145,156,186,198,216],"predict":[11,199,209],"a":[12,39,44,50,61],"specific":[13],"room":[14,21,111],"impulse":[15],"response":[16],"(RIR)":[17],"between":[18],"two":[19],"given":[20],"locations.":[22],"We":[23],"use":[24],"three":[25,194],"end-to-end":[26],"learning":[28],"(DL)":[29],"models":[30,185],"based":[31],"on":[32,170],"encoder-decoder":[34],"structure:":[35],"an":[36,114],"auto-encoder":[37],"(AE),":[38],"variational":[40],"AE":[41],"(VAE)":[42],"and":[43,75,78,89,96,109,147,163],"UNet.":[45],"They":[46],"try":[47],"generate":[49],"new":[51,76],"RIR":[52,63],"given:":[53],"1)":[54],"short-time":[56],"Fourier":[57],"transform":[58],"(STFT)":[59],"true":[62,74],"from":[64],"same":[66],"room,":[67],"2)":[68],"spatial":[70,107],"coordinates":[71,108],"RIRs,":[77],"3)":[79],"several":[80],"room-related":[81],"parameters.":[82],"On":[83,102],"one":[85],"hand,":[86,105],"magnitude":[88,162,201],"phase":[90,164],"STFT":[93],"are":[94,196],"computed":[95],"presented":[97],"DNN":[100],"input.":[101],"other":[104],"parameters":[112],"form":[113],"information":[115],"vector":[116],"that":[117,192],"is":[118],"embedded":[119],"into":[120],"DNNs":[122,195],"through":[123],"their":[124,214],"latent":[125],"space":[126],"(AE,":[127],"VAE)":[128],"or":[129],"equivalent":[130],"layer":[131],"(UNet).":[132],"A":[133],"real":[134],"database":[135],"RIRs":[137],"measured":[138],"in":[139],"five":[140],"different":[141],"rooms":[142],"was":[143],"used":[144],"train":[146],"test":[148],"models.":[150,175],"Two":[151],"experiments":[152],"were":[153],"carried":[154],"out":[155],"study":[157],"influence":[159],"terms":[165],"loss":[168],"function":[169],"performance":[172],"An":[176],"additional":[177],"experiment":[178],"investigated":[179],"DL":[184],"generalize":[187,217],"across":[188,218],"rooms.":[189],"Results":[190],"show":[191],"able":[197],"STFT,":[204],"but":[205],"they":[206],"cannot":[207],"accurately":[208],"its":[210],"phase.":[211],"When":[212],"comparing":[213],"spaces,":[219],"UNet":[221],"achieves":[222],"best":[224],"results.":[225]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
