{"id":"https://openalex.org/W4214652421","doi":"https://doi.org/10.1109/taslp.2022.3153266","title":"Sparse DNN Model for Frequency Expanding of Higher Order Ambisonics Encoding Process","display_name":"Sparse DNN Model for Frequency Expanding of Higher Order Ambisonics Encoding Process","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4214652421","doi":"https://doi.org/10.1109/taslp.2022.3153266"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2022.3153266","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2022.3153266","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100650768","display_name":"Shan Gao","orcid":"https://orcid.org/0000-0003-1189-7776"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shan Gao","raw_affiliation_strings":["Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101972535","display_name":"Lin Jing","orcid":"https://orcid.org/0000-0002-7046-8018"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Lin","raw_affiliation_strings":["Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084685506","display_name":"Xihong Wu","orcid":"https://orcid.org/0009-0004-5236-7469"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xihong Wu","raw_affiliation_strings":["Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103080532","display_name":"Tianshu Qu","orcid":"https://orcid.org/0000-0001-6256-2031"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianshu Qu","raw_affiliation_strings":["Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory on Machine Perception (Ministry of Education), School of Artificial Intelligence, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100650768"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":1.6375,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.82598511,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"30","issue":null,"first_page":"1124","last_page":"1135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambisonics","display_name":"Ambisonics","score":0.8432040214538574},{"id":"https://openalex.org/keywords/aliasing","display_name":"Aliasing","score":0.6814268827438354},{"id":"https://openalex.org/keywords/spherical-harmonics","display_name":"Spherical harmonics","score":0.6302218437194824},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5925440788269043},{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.5756122469902039},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5508424043655396},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5052409768104553},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.4228995740413666},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4179796278476715},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41589099168777466},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40082815289497375},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.360627144575119},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2864277958869934},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.24147874116897583},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.14423099160194397},{"id":"https://openalex.org/keywords/loudspeaker","display_name":"Loudspeaker","score":0.09273287653923035}],"concepts":[{"id":"https://openalex.org/C47726159","wikidata":"https://www.wikidata.org/wiki/Q457547","display_name":"Ambisonics","level":3,"score":0.8432040214538574},{"id":"https://openalex.org/C4069607","wikidata":"https://www.wikidata.org/wiki/Q868732","display_name":"Aliasing","level":3,"score":0.6814268827438354},{"id":"https://openalex.org/C3768446","wikidata":"https://www.wikidata.org/wiki/Q877100","display_name":"Spherical harmonics","level":2,"score":0.6302218437194824},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5925440788269043},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.5756122469902039},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5508424043655396},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5052409768104553},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.4228995740413666},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4179796278476715},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41589099168777466},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40082815289497375},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.360627144575119},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2864277958869934},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.24147874116897583},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.14423099160194397},{"id":"https://openalex.org/C157138929","wikidata":"https://www.wikidata.org/wiki/Q570","display_name":"Loudspeaker","level":2,"score":0.09273287653923035},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C136536468","wikidata":"https://www.wikidata.org/wiki/Q1225894","display_name":"Undersampling","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2022.3153266","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2022.3153266","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.41999998688697815,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G2401495373","display_name":null,"funder_award_id":"61421062","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3389713118","display_name":null,"funder_award_id":"61175043","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6431705132","display_name":null,"funder_award_id":"U1713217","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8358198455","display_name":null,"funder_award_id":"2019YFC1408501","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1511723925","https://openalex.org/W1980903300","https://openalex.org/W1987213958","https://openalex.org/W1987906574","https://openalex.org/W1990055747","https://openalex.org/W2034119727","https://openalex.org/W2037814094","https://openalex.org/W2044468335","https://openalex.org/W2056212252","https://openalex.org/W2064233625","https://openalex.org/W2068815893","https://openalex.org/W2105808261","https://openalex.org/W2117678320","https://openalex.org/W2129501075","https://openalex.org/W2158941010","https://openalex.org/W2158995216","https://openalex.org/W2160525176","https://openalex.org/W2316102541","https://openalex.org/W2936333379","https://openalex.org/W4241672163","https://openalex.org/W6630773358","https://openalex.org/W6638896900","https://openalex.org/W6659849957","https://openalex.org/W6679718588","https://openalex.org/W7046848240"],"related_works":["https://openalex.org/W62656364","https://openalex.org/W4387871131","https://openalex.org/W2403497458","https://openalex.org/W4400519017","https://openalex.org/W1571600724","https://openalex.org/W2789837483","https://openalex.org/W2179914803","https://openalex.org/W2937253377","https://openalex.org/W2015882865","https://openalex.org/W1987213958"],"abstract_inverted_index":{"The":[0,135],"performance":[1,128,188],"of":[2,19,48,119,151],"higherorder":[3],"Ambisonics":[4],"(HOA)":[5],"signals":[6,38,70,103,146],"obtained":[7],"using":[8,44],"spherical":[9,86],"harmonics":[10,87],"decomposition":[11,58],"method":[12],"is":[13,42,133],"disturbed":[14],"by":[15,35],"two":[16],"primary":[17],"sources":[18,155],"errors,":[20],"the":[21,28,36,45,49,77,85,93,100,116,120,126,130,140,169,180,186,190],"noise":[22],"pollution":[23],"in":[24,31],"low-frequency":[25],"band":[26],"and":[27,160],"spatial":[29,94],"aliasing":[30,95],"high-frequency":[32],"band.":[33],"Inspired":[34],"HOA":[37,69,102,145],"upscale":[39],"method,":[40],"which":[41,99,123],"performed":[43],"sparse":[46,63,111,117,131],"character":[47],"sound":[50,56,121],"field,":[51],"this":[52],"paper":[53],"propose":[54],"a":[55,62,110],"field":[57,122],"model":[59,127,142,183],"based":[60,97],"on":[61,98],"deep":[64],"neural":[65],"network":[66,82,113,182],"that":[67,139],"offers":[68],"with":[71,147],"wider":[72,148],"frequency":[73,78,149],"bandwidth.":[74],"We":[75],"use":[76],"domain":[79],"multi-scale":[80],"convolutional":[81],"to":[83,114,157],"realize":[84],"decomposition,":[88],"as":[89,91,189],"well":[90],"learning":[92],"pattern,":[96],"aliasing-free":[101],"can":[104,143],"be":[105,173],"derived.":[106],"Besides,":[107],"we":[108],"apply":[109],"encoding":[112],"cpature":[115],"feature":[118,171],"will":[124],"improve":[125],"when":[129],"condition":[132],"satisfied.":[134],"experiments":[136],"results":[137],"prove":[138],"proposed":[141,181],"obtain":[144],"range":[150],"operation":[152],"under":[153],"multiple":[154],"(up":[156],"10":[158],"sources)":[159],"low":[161],"reverberant":[162],"environments":[163],"(<inline-formula><tex-math":[164,175],"notation=\"LaTeX\">$T_{60}\\le$</tex-math></inline-formula>":[165],"400":[166],"ms).":[167],"When":[168],"sparsity":[170],"cannot":[172],"satisfied":[174],"notation=\"LaTeX\">$T_{60}":[176],"=$</tex-math></inline-formula>":[177],"800":[178],"ms),":[179],"still":[184],"maintain":[185],"same":[187],"traditional":[191],"methods.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
