{"id":"https://openalex.org/W4408353159","doi":"https://doi.org/10.1109/icassp49660.2025.10889788","title":"Disentanglement Analysis in Deep Latent Variable Models Matching Aggregate Posterior Distributions","display_name":"Disentanglement Analysis in Deep Latent Variable Models Matching Aggregate Posterior Distributions","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408353159","doi":"https://doi.org/10.1109/icassp49660.2025.10889788"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10889788","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889788","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066712825","display_name":"Surojit Saha","orcid":"https://orcid.org/0000-0002-3333-8070"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Surojit Saha","raw_affiliation_strings":["The University of Utah,SCI, Kahlert School of Computing,Salt Lake City,USA"],"affiliations":[{"raw_affiliation_string":"The University of Utah,SCI, Kahlert School of Computing,Salt Lake City,USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102835648","display_name":"Sarang Joshi","orcid":"https://orcid.org/0000-0002-3446-4810"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sarang Joshi","raw_affiliation_strings":["The University of Utah,SCI, Kahlert School of Computing,Salt Lake City,USA"],"affiliations":[{"raw_affiliation_string":"The University of Utah,SCI, Kahlert School of Computing,Salt Lake City,USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109840277","display_name":"Ross Whitaker","orcid":null},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ross Whitaker","raw_affiliation_strings":["The University of Utah,SCI, Kahlert School of Computing,Salt Lake City,USA"],"affiliations":[{"raw_affiliation_string":"The University of Utah,SCI, Kahlert School of Computing,Salt Lake City,USA","institution_ids":["https://openalex.org/I223532165"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5066712825"],"corresponding_institution_ids":["https://openalex.org/I223532165"],"apc_list":null,"apc_paid":null,"fwci":1.319,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.77945962,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8501999974250793,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8501999974250793,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-variable","display_name":"Latent variable","score":0.7526512145996094},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6315488219261169},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.6222080588340759},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.5341137051582336},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5336086750030518},{"id":"https://openalex.org/keywords/latent-variable-model","display_name":"Latent variable model","score":0.5203920602798462},{"id":"https://openalex.org/keywords/variable","display_name":"Variable (mathematics)","score":0.448606014251709},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.4159941077232361},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32820069789886475},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.27348288893699646}],"concepts":[{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.7526512145996094},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6315488219261169},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.6222080588340759},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.5341137051582336},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5336086750030518},{"id":"https://openalex.org/C65965080","wikidata":"https://www.wikidata.org/wiki/Q1806885","display_name":"Latent variable model","level":3,"score":0.5203920602798462},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.448606014251709},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.4159941077232361},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32820069789886475},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27348288893699646},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10889788","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889788","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6299999952316284}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2163922914","https://openalex.org/W2966574105","https://openalex.org/W2968131493","https://openalex.org/W3096515130","https://openalex.org/W4296051398","https://openalex.org/W4404931176","https://openalex.org/W6639732818","https://openalex.org/W6640963894","https://openalex.org/W6736057607","https://openalex.org/W6743661861","https://openalex.org/W6745535286","https://openalex.org/W6745687250","https://openalex.org/W6748223763","https://openalex.org/W6748445624","https://openalex.org/W6748499346","https://openalex.org/W6756663807","https://openalex.org/W6760514122","https://openalex.org/W6769849856","https://openalex.org/W6780248173","https://openalex.org/W6846207252","https://openalex.org/W6955712162"],"related_works":["https://openalex.org/W2461917396","https://openalex.org/W2037497866","https://openalex.org/W4243467573","https://openalex.org/W62001224","https://openalex.org/W1502435251","https://openalex.org/W3032390039","https://openalex.org/W1584341211","https://openalex.org/W3122667150","https://openalex.org/W3145681568","https://openalex.org/W4393387622"],"abstract_inverted_index":{"Deep":[0],"latent":[1,25,64,68,79,90,114,122,145,161],"variable":[2],"models":[3],"(DLVMs)":[4],"are":[5,21,86,96],"designed":[6],"to":[7,45,109,132],"learn":[8],"meaningful":[9],"representations":[10],"in":[11,41,84,138],"an":[12],"unsupervised":[13],"manner,":[14],"such":[15,99],"that":[16,58,77,154],"the":[17,46,49,60,63,67,78,82,89,101,106,110,113,121,144,148,159,166,169],"hidden":[18],"explanatory":[19],"factors":[20,65,150],"interpretable":[22],"by":[23],"independent":[24],"variables":[26,80,115],"(aka":[27],"disentanglement).":[28],"The":[29,140],"variational":[30],"autoencoder":[31],"(VAE)":[32],"[1],":[33],"[2]":[34],"is":[35],"a":[36,53,129,152],"popular":[37],"DLVM":[38],"widely":[39],"studied":[40],"disentanglement":[42,134],"analysis":[43],"due":[44],"modeling":[47],"of":[48,62,151,168],"posterior":[50,108],"distribution":[51,56],"using":[52],"factorized":[54],"Gaussian":[55],"[3]":[57],"encourages":[59],"alignment":[61],"with":[66,88,120],"axes.":[69,123,162],"Several":[70],"metrics":[71],"have":[72],"been":[73],"proposed":[74,141],"recently,":[75],"assuming":[76],"explaining":[81],"variation":[83],"data":[85],"aligned":[87,119],"axes":[91],"(cardinal":[92],"directions).":[93],"However,":[94],"there":[95],"other":[97],"DLVMs,":[98],"as":[100],"AAE":[102],"and":[103],"WAE-MMD":[104],"(matching":[105],"aggregate":[107],"prior),":[111],"where":[112],"might":[116],"not":[117],"be":[118,156],"In":[124],"this":[125],"work,":[126],"we":[127],"propose":[128],"statistical":[130],"method":[131,170],"evaluate":[133],"for":[135],"any":[136],"DLVMs":[137],"general.":[139],"technique":[142],"discovers":[143],"vectors":[146],"representing":[147],"generative":[149],"dataset":[153],"can":[155],"different":[157],"from":[158],"cardinal":[160],"We":[163],"empirically":[164],"demonstrate":[165],"advantage":[167],"on":[171],"two":[172],"datasets.":[173]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
