{"id":"https://openalex.org/W4408353678","doi":"https://doi.org/10.1109/icassp49660.2025.10889363","title":"A Hierarchical Taxonomy For Deep State Space Models","display_name":"A Hierarchical Taxonomy For Deep State Space Models","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408353678","doi":"https://doi.org/10.1109/icassp49660.2025.10889363"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10889363","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889363","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.vu.nl/en/publications/eacd81e6-ab00-4b8e-830d-501a4275241b","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004341643","display_name":"Shiqin Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Shiqin Tang","raw_affiliation_strings":["City University of Hong Kong,Department of Data Science,Hong Kong,Hong Kong"],"affiliations":[{"raw_affiliation_string":"City University of Hong Kong,Department of Data Science,Hong Kong,Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004050684","display_name":"Pengxing Feng","orcid":"https://orcid.org/0000-0002-8946-2388"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Pengxing Feng","raw_affiliation_strings":["City University of Hong Kong,Department of Electrical Engineering,Hong Kong"],"affiliations":[{"raw_affiliation_string":"City University of Hong Kong,Department of Electrical Engineering,Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041358503","display_name":"Shujian Yu","orcid":"https://orcid.org/0000-0002-6385-1705"},"institutions":[{"id":"https://openalex.org/I865915315","display_name":"Vrije Universiteit Amsterdam","ror":"https://ror.org/008xxew50","country_code":"NL","type":"education","lineage":["https://openalex.org/I865915315"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Shujian Yu","raw_affiliation_strings":["Vrije Universiteit Amsterdam,Department of Artificial Intelligence,Amsterdam,Netherlands"],"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Amsterdam,Department of Artificial Intelligence,Amsterdam,Netherlands","institution_ids":["https://openalex.org/I865915315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008216820","display_name":"Yining Dong","orcid":"https://orcid.org/0000-0002-4617-6947"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yining Dong","raw_affiliation_strings":["City University of Hong Kong,Department of Data Science,Hong Kong"],"affiliations":[{"raw_affiliation_string":"City University of Hong Kong,Department of Data Science,Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056937548","display_name":"S. Joe Qin","orcid":"https://orcid.org/0000-0001-7631-2535"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"S. Joe Qin","raw_affiliation_strings":["Lingnan University,Department of Computing and Decision Science,Hong Kong"],"affiliations":[{"raw_affiliation_string":"Lingnan University,Department of Computing and Decision Science,Hong Kong","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5004341643"],"corresponding_institution_ids":["https://openalex.org/I168719708"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04797145,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.5867000222206116,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.5867000222206116,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/taxonomy","display_name":"Taxonomy (biology)","score":0.6717612147331238},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6556971073150635},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39227408170700073},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.08135202527046204},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.06822261214256287}],"concepts":[{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.6717612147331238},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6556971073150635},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39227408170700073},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.08135202527046204},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.06822261214256287}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/icassp49660.2025.10889363","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889363","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:research.vu.nl:openaire/eacd81e6-ab00-4b8e-830d-501a4275241b","is_oa":true,"landing_page_url":"https://research.vu.nl/en/publications/eacd81e6-ab00-4b8e-830d-501a4275241b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Tang, S, Feng, P, Yu, S, Dong, Y & Qin, S J 2025, A Hierarchical Taxonomy For Deep State Space Models. in B D Rao, I Trancoso, G Sharma & N B Mehta (eds), ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) : [Proceedings]. ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings, vol. 2025, Institute of Electrical and Electronics Engineers Inc., pp. 1-5, 2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025, Hyderabad, India, 6/04/25. https://doi.org/10.1109/ICASSP49660.2025.10889363","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:research.vu.nl:publications/eacd81e6-ab00-4b8e-830d-501a4275241b","is_oa":true,"landing_page_url":"https://hdl.handle.net/1871.1/eacd81e6-ab00-4b8e-830d-501a4275241b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Tang, S, Feng, P, Yu, S, Dong, Y & Qin, S J 2025, A Hierarchical Taxonomy For Deep State Space Models. in B D Rao, I Trancoso, G Sharma & N B Mehta (eds), ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) : [Proceedings]. ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings, vol. 2025, Institute of Electrical and Electronics Engineers Inc., pp. 1-5, 2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025, Hyderabad, India, 6/04/25. https://doi.org/10.1109/ICASSP49660.2025.10889363","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:research.vu.nl:openaire/eacd81e6-ab00-4b8e-830d-501a4275241b","is_oa":true,"landing_page_url":"https://research.vu.nl/en/publications/eacd81e6-ab00-4b8e-830d-501a4275241b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Tang, S, Feng, P, Yu, S, Dong, Y & Qin, S J 2025, A Hierarchical Taxonomy For Deep State Space Models. in B D Rao, I Trancoso, G Sharma & N B Mehta (eds), ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) : [Proceedings]. ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings, vol. 2025, Institute of Electrical and Electronics Engineers Inc., pp. 1-5, 2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025, Hyderabad, India, 6/04/25. https://doi.org/10.1109/ICASSP49660.2025.10889363","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2052441401","https://openalex.org/W2163922914","https://openalex.org/W2953223332","https://openalex.org/W2964232608","https://openalex.org/W2991019415","https://openalex.org/W3005621653","https://openalex.org/W3094953545","https://openalex.org/W3174902251","https://openalex.org/W3217536461","https://openalex.org/W4311841227","https://openalex.org/W4392910606","https://openalex.org/W6610566761","https://openalex.org/W6617744952","https://openalex.org/W6628877408","https://openalex.org/W6631190155","https://openalex.org/W6639735774","https://openalex.org/W6640963894","https://openalex.org/W6712395597","https://openalex.org/W6730998768","https://openalex.org/W6733471323","https://openalex.org/W6743827229","https://openalex.org/W6748392304","https://openalex.org/W6755447188","https://openalex.org/W6756256016","https://openalex.org/W6772911725","https://openalex.org/W6852702218"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Modeling":[0],"nonlinear":[1,113],"dynamical":[2],"systems":[3],"is":[4],"a":[5,22],"challenging":[6],"task":[7],"in":[8,129],"fields":[9],"such":[10],"as":[11],"speech":[12,130],"processing,":[13],"music":[14,133],"generation,":[15],"and":[16,38,41,60,74,125,131],"video":[17],"prediction.":[18],"This":[19],"paper":[20],"introduces":[21],"hierarchical":[23],"framework":[24],"for":[25,70,103,111],"Deep":[26],"State":[27,62,121],"Space":[28,63,122],"Models":[29],"(DSSMs),":[30],"categorizing":[31],"them":[32],"by":[33,84],"their":[34],"conditional":[35],"independence":[36],"properties":[37],"Markov":[39],"assumptions":[40],"positioning":[42],"existing":[43,96],"models":[44,97],"within":[45],"this":[46],"framework,":[47],"including":[48],"the":[49,71,93,101,104,119],"Stochastic":[50],"Recurrent":[51,56,61],"Neural":[52,57],"Network":[53,58],"(SRNN),":[54],"Variational":[55],"(VRNN),":[59],"Model":[64,123],"(RSSM).":[65],"We":[66],"discuss":[67],"different":[68],"options":[69],"inference":[72],"networks":[73],"demonstrate":[75],"how":[76],"integrating":[77],"normalizing":[78],"flows":[79],"can":[80],"enhance":[81],"model":[82],"flexibility":[83],"capturing":[85],"complex":[86],"distributions.":[87],"Our":[88],"work":[89],"not":[90],"only":[91],"clarifies":[92],"relationships":[94],"among":[95],"but":[98],"also":[99],"paves":[100],"way":[102],"development":[105],"of":[106],"new,":[107],"more":[108],"effective":[109],"approaches":[110],"modeling":[112,134],"dynamics.":[114],"In":[115],"particular,":[116],"we":[117],"propose":[118],"Autoregressive":[120],"(ArSSM)":[124],"evaluate":[126],"its":[127],"effectiveness":[128],"polyphonic":[132],"tasks.":[135]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
