{"id":"https://openalex.org/W2939124443","doi":"https://doi.org/10.1109/icassp.2019.8683814","title":"Autoencoding HRTFS for DNN Based HRTF Personalization Using Anthropometric Features","display_name":"Autoencoding HRTFS for DNN Based HRTF Personalization Using Anthropometric Features","publication_year":2019,"publication_date":"2019-04-17","ids":{"openalex":"https://openalex.org/W2939124443","doi":"https://doi.org/10.1109/icassp.2019.8683814","mag":"2939124443"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2019.8683814","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2019.8683814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2019 - 2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110608735","display_name":"Tzu\u2010Yu Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Tzu-Yu Chen","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062616760","display_name":"Tzu-Hsuan Kuo","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tzu-Hsuan Kuo","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088864528","display_name":"Tai-Shih Chi","orcid":"https://orcid.org/0000-0002-0584-8399"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tai-Shih Chi","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110608735"],"corresponding_institution_ids":["https://openalex.org/I148366613"],"apc_list":null,"apc_paid":null,"fwci":2.0674,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.86425088,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"271","last_page":"275"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.9066994190216064},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.8604027032852173},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7153674364089966},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5871378779411316},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.580620288848877},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5239158868789673},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5191173553466797},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47382983565330505},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.4437614381313324},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4148092567920685},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33672285079956055},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09467923641204834}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.9066994190216064},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.8604027032852173},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7153674364089966},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5871378779411316},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.580620288848877},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5239158868789673},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5191173553466797},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47382983565330505},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.4437614381313324},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4148092567920685},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33672285079956055},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09467923641204834},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2019.8683814","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2019.8683814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2019 - 2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1505940281","https://openalex.org/W1582958321","https://openalex.org/W1971016029","https://openalex.org/W1974038455","https://openalex.org/W2001141328","https://openalex.org/W2023055131","https://openalex.org/W2025919462","https://openalex.org/W2043473991","https://openalex.org/W2059747271","https://openalex.org/W2087072911","https://openalex.org/W2094846694","https://openalex.org/W2095926185","https://openalex.org/W2108668360","https://openalex.org/W2111889754","https://openalex.org/W2116114278","https://openalex.org/W2258771979","https://openalex.org/W2290578471","https://openalex.org/W2396365566","https://openalex.org/W2762025550","https://openalex.org/W2764260703","https://openalex.org/W6676550410","https://openalex.org/W6692284154","https://openalex.org/W6745267900","https://openalex.org/W6745340762"],"related_works":["https://openalex.org/W1574414179","https://openalex.org/W4362597605","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W4297676672","https://openalex.org/W4281702477","https://openalex.org/W4378510483","https://openalex.org/W4376166922","https://openalex.org/W2810330923","https://openalex.org/W4289763776"],"abstract_inverted_index":{"We":[0],"proposed":[1,96,124],"a":[2,46,65,101],"deep":[3],"neural":[4,80],"network":[5],"(DNN)":[6],"based":[7],"approach":[8,97,125],"to":[9,50,68,85,93,115],"synthesize":[10,69],"the":[11,23,27,52,58,62,70,76,79,117,123],"magnitude":[12,71],"of":[13,22,61,78,129],"personalized":[14],"head-related":[15],"transfer":[16],"functions":[17],"(HRTFs)":[18],"using":[19],"anthropometric":[20],"features":[21],"user.":[24],"To":[25],"mitigate":[26],"over-fitting":[28],"problem":[29],"when":[30],"training":[31],"dataset":[32],"is":[33],"not":[34],"very":[35],"large,":[36],"we":[37,56],"built":[38],"an":[39],"autoencoder":[40,63],"for":[41],"dimensional":[42],"reduction":[43],"and":[44],"establishing":[45],"crucial":[47],"feature":[48],"set":[49],"represent":[51],"raw":[53],"HRTFs.":[54,72],"Then":[55],"combined":[57],"decoder":[59],"part":[60],"with":[64,89,100,105,132],"smaller":[66],"DNN":[67,103],"In":[73],"this":[74],"way,":[75],"complexity":[77],"networks":[81],"was":[82,98,113],"greatly":[83],"reduced":[84],"prevent":[86],"unstable":[87],"results":[88,120],"large":[90],"variance":[91],"due":[92],"overfitting.":[94],"The":[95,108],"compared":[99],"baseline":[102],"model":[104],"no":[106],"autoencoder.":[107],"log-spectral":[109],"distortion":[110],"(LSD)":[111],"metric":[112],"used":[114],"evaluate":[116],"performance.":[118],"Experiment":[119],"show":[121],"that":[122],"can":[126],"reduce":[127],"LSD":[128],"estimated":[130],"HRTFs":[131],"greater":[133],"stability.":[134]},"counts_by_year":[{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
