{"id":"https://openalex.org/W4415708190","doi":"https://doi.org/10.1109/icme59968.2025.11208941","title":"Robust Generalized Zero-Shot Learning via Dual-Stream Variational Autoencoders and Out-of-Distribution Detection","display_name":"Robust Generalized Zero-Shot Learning via Dual-Stream Variational Autoencoders and Out-of-Distribution Detection","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415708190","doi":"https://doi.org/10.1109/icme59968.2025.11208941"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11208941","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11208941","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101004315","display_name":"Xue Han","orcid":"https://orcid.org/0009-0008-1911-2674"},"institutions":[{"id":"https://openalex.org/I12615008","display_name":"Beijing Normal-Hong Kong Baptist University","ror":"https://ror.org/04snvc712","country_code":"CN","type":"education","lineage":["https://openalex.org/I12615008"]},{"id":"https://openalex.org/I141568987","display_name":"Hong Kong Baptist University","ror":"https://ror.org/0145fw131","country_code":"HK","type":"education","lineage":["https://openalex.org/I141568987"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Xue Han","raw_affiliation_strings":["Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China","institution_ids":["https://openalex.org/I12615008","https://openalex.org/I141568987"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101619559","display_name":"Zhixiang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I12615008","display_name":"Beijing Normal-Hong Kong Baptist University","ror":"https://ror.org/04snvc712","country_code":"CN","type":"education","lineage":["https://openalex.org/I12615008"]},{"id":"https://openalex.org/I141568987","display_name":"Hong Kong Baptist University","ror":"https://ror.org/0145fw131","country_code":"HK","type":"education","lineage":["https://openalex.org/I141568987"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Zhixiang Li","raw_affiliation_strings":["Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China","institution_ids":["https://openalex.org/I12615008","https://openalex.org/I141568987"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069202911","display_name":"Wenchuan Zhang","orcid":"https://orcid.org/0000-0001-9632-6424"},"institutions":[{"id":"https://openalex.org/I12615008","display_name":"Beijing Normal-Hong Kong Baptist University","ror":"https://ror.org/04snvc712","country_code":"CN","type":"education","lineage":["https://openalex.org/I12615008"]},{"id":"https://openalex.org/I141568987","display_name":"Hong Kong Baptist University","ror":"https://ror.org/0145fw131","country_code":"HK","type":"education","lineage":["https://openalex.org/I141568987"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Wenchuan Zhang","raw_affiliation_strings":["Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China","institution_ids":["https://openalex.org/I12615008","https://openalex.org/I141568987"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106223300","display_name":"Hanyuan Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I119045251","display_name":"Huaqiao University","ror":"https://ror.org/03frdh605","country_code":"CN","type":"education","lineage":["https://openalex.org/I119045251"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanyuan Huang","raw_affiliation_strings":["Huaqiao University,Department of Computer Science and Technology,Xiamen,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Huaqiao University,Department of Computer Science and Technology,Xiamen,China","institution_ids":["https://openalex.org/I119045251"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056455910","display_name":"Wentao Fan","orcid":"https://orcid.org/0000-0001-6694-7289"},"institutions":[{"id":"https://openalex.org/I12615008","display_name":"Beijing Normal-Hong Kong Baptist University","ror":"https://ror.org/04snvc712","country_code":"CN","type":"education","lineage":["https://openalex.org/I12615008"]},{"id":"https://openalex.org/I141568987","display_name":"Hong Kong Baptist University","ror":"https://ror.org/0145fw131","country_code":"HK","type":"education","lineage":["https://openalex.org/I141568987"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Wentao Fan","raw_affiliation_strings":["Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Normal-Hong Kong Baptist University,Guangdong Provincial/Zhuhai Key Laboratory of IRADS,Department of Computer Science,Zhuhai,China","institution_ids":["https://openalex.org/I12615008","https://openalex.org/I141568987"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14876973,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.7203999757766724,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.7203999757766724,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.14810000360012054,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.03620000183582306,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.7300000190734863},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7185999751091003},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.5760999917984009},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.48649999499320984},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4336000084877014},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4235999882221222},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.41499999165534973},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4099999964237213},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.40709999203681946}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7418000102043152},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.7300000190734863},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7185999751091003},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7053999900817871},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.5760999917984009},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4880000054836273},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.48649999499320984},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4336000084877014},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4235999882221222},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.41499999165534973},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4099999964237213},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.40709999203681946},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3540000021457672},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.3456999957561493},{"id":"https://openalex.org/C2780440489","wikidata":"https://www.wikidata.org/wiki/Q5227278","display_name":"Data-driven","level":2,"score":0.3456000089645386},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.32710000872612},{"id":"https://openalex.org/C2988382989","wikidata":"https://www.wikidata.org/wiki/Q370685","display_name":"Data space","level":2,"score":0.32710000872612},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.303600013256073},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.3012000024318695},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C3020001037","wikidata":"https://www.wikidata.org/wiki/Q836575","display_name":"Quality assessment","level":3,"score":0.2653000056743622},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2590000033378601}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11208941","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11208941","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2032699694","https://openalex.org/W2128532956","https://openalex.org/W2533598788","https://openalex.org/W2808717788","https://openalex.org/W2887567284","https://openalex.org/W2924476266","https://openalex.org/W2962689421","https://openalex.org/W2963283377","https://openalex.org/W2963499153","https://openalex.org/W2963960318","https://openalex.org/W2964149421","https://openalex.org/W2964162033","https://openalex.org/W2965373098","https://openalex.org/W2970539178","https://openalex.org/W2981648435","https://openalex.org/W2982234480","https://openalex.org/W2990947836","https://openalex.org/W3009656642","https://openalex.org/W3034730995","https://openalex.org/W3096831136","https://openalex.org/W3109728025","https://openalex.org/W3109994846","https://openalex.org/W3148105697","https://openalex.org/W3171926364","https://openalex.org/W3203055845","https://openalex.org/W4229482837","https://openalex.org/W4312283137","https://openalex.org/W4315643925","https://openalex.org/W4382466082","https://openalex.org/W4386076660","https://openalex.org/W4409917443"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,101],"propose":[4],"a":[5,31,38,75,107],"novel":[6],"Generalized":[7],"Zero-Shot":[8],"Learning":[9],"(GZSL)":[10],"approach":[11],"that":[12],"integrates":[13],"out-of-distribution":[14],"(OOD)":[15],"detection":[16],"mechanisms":[17],"into":[18],"the":[19,25,68,79,96,103,113,120,135],"architecture":[20],"of":[21,27,85,98,115,137],"generative":[22],"models.":[23],"At":[24],"core":[26],"our":[28,52,138],"method":[29],"is":[30],"dual-stream":[32,104],"Variational":[33],"Autoencoder":[34],"(VAE),":[35],"which":[36,82],"creates":[37],"unified":[39],"latent":[40,80],"space":[41],"to":[42,78],"align":[43],"data":[44,117,126],"distributions":[45],"from":[46],"different":[47],"modalities.":[48],"This":[49],"alignment":[50],"helps":[51],"model":[53,69],"better":[54],"identify":[55],"unseen":[56,88],"classes":[57,89],"by":[58,70],"reducing":[59],"bias":[60],"using":[61],"class-specific":[62],"distribution":[63],"ranges.":[64],"We":[65],"further":[66],"improve":[67],"adding":[71],"contrastive":[72],"learning":[73],"and":[74,87,90,118],"classification":[76],"loss":[77],"space,":[81],"separates":[83],"features":[84],"seen":[86],"reduces":[91],"feature":[92],"confusion.":[93],"To":[94],"enhance":[95],"quality":[97,114],"generated":[99],"data,":[100],"combine":[102],"VAE":[105],"with":[106],"Generative":[108],"Adversarial":[109],"Network":[110],"(GAN),":[111],"enhancing":[112],"synthetic":[116],"improving":[119],"model\u2019s":[121],"robustness":[122],"against":[123],"variations":[124],"in":[125,143],"distribution.":[127],"Extensive":[128],"validation":[129],"on":[130],"popular":[131],"benchmarks":[132],"has":[133],"confirmed":[134],"effectiveness":[136],"approach,":[139],"demonstrating":[140],"notable":[141],"improvements":[142],"GZSL":[144],"performance.":[145]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-30T00:00:00"}
