{"id":"https://openalex.org/W4313226937","doi":"https://doi.org/10.1109/besc57393.2022.9995148","title":"Multi-dimensional alignment via Variational Autoencoders for Generalized Zero-Shot and Few-Shot Learning","display_name":"Multi-dimensional alignment via Variational Autoencoders for Generalized Zero-Shot and Few-Shot Learning","publication_year":2022,"publication_date":"2022-10-29","ids":{"openalex":"https://openalex.org/W4313226937","doi":"https://doi.org/10.1109/besc57393.2022.9995148"},"language":"en","primary_location":{"id":"doi:10.1109/besc57393.2022.9995148","is_oa":false,"landing_page_url":"https://doi.org/10.1109/besc57393.2022.9995148","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 9th International Conference on Behavioural and Social Computing (BESC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://figshare.com/articles/conference_contribution/Multi-dimensional_alignment_via_Variational_Autoencoders_for_Generalized_Zero-Shot_and_Few-Shot_Learning/22124498","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004613426","display_name":"Jiyan Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiyan Cai","raw_affiliation_strings":["Wuhan University,School of Cyber Science and Engineering,Wuhan,China","School of Cyber Science and Engineering, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Cyber Science and Engineering,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Cyber Science and Engineering, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108047844","display_name":"Libing Wu","orcid":"https://orcid.org/0000-0001-9897-1953"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Libing Wu","raw_affiliation_strings":["Wuhan University,School of Cyber Science and Engineering,Wuhan,China","School of Cyber Science and Engineering, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Cyber Science and Engineering,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Cyber Science and Engineering, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090936368","display_name":"Dan Wu","orcid":"https://orcid.org/0000-0001-9669-2600"},"institutions":[{"id":"https://openalex.org/I74413500","display_name":"University of Windsor","ror":"https://ror.org/01gw3d370","country_code":"CA","type":"education","lineage":["https://openalex.org/I74413500"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Dan Wu","raw_affiliation_strings":["University of Windsor,School of Computer Science,Ontario,Canada","School of Computer Science, University of Windsor, Ontario, Canada"],"affiliations":[{"raw_affiliation_string":"University of Windsor,School of Computer Science,Ontario,Canada","institution_ids":["https://openalex.org/I74413500"]},{"raw_affiliation_string":"School of Computer Science, University of Windsor, Ontario, Canada","institution_ids":["https://openalex.org/I74413500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100380474","display_name":"Jianxin Li","orcid":"https://orcid.org/0000-0002-9059-330X"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jianxin Li","raw_affiliation_strings":["Deakin University,School of Information Technology,Geelong,Australia","School of Information Technology, Deakin University, Geelong, Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University,School of Information Technology,Geelong,Australia","institution_ids":["https://openalex.org/I149704539"]},{"raw_affiliation_string":"School of Information Technology, Deakin University, Geelong, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043353686","display_name":"Xianfeng Wu","orcid":"https://orcid.org/0000-0002-5113-5314"},"institutions":[{"id":"https://openalex.org/I31590910","display_name":"Jianghan University","ror":"https://ror.org/041c9x778","country_code":"CN","type":"education","lineage":["https://openalex.org/I31590910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianfeng Wu","raw_affiliation_strings":["Jianghan University,Institute for Interdisciplinary Research,Wuhan,China","Institute for Interdisciplinary Research, Jianghan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Jianghan University,Institute for Interdisciplinary Research,Wuhan,China","institution_ids":["https://openalex.org/I31590910"]},{"raw_affiliation_string":"Institute for Interdisciplinary Research, Jianghan University, Wuhan, China","institution_ids":["https://openalex.org/I31590910"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5004613426"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.1389,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.57302889,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"30","issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9715999960899353,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9588000178337097,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8214216232299805},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7891334295272827},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7261193990707397},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6243650913238525},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5754610300064087},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5547010898590088},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4823829233646393},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.4749719500541687},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4449310004711151},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4363236725330353},{"id":"https://openalex.org/keywords/visual-space","display_name":"Visual space","score":0.43398404121398926},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.41474050283432007},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3242563009262085},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.32126384973526}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8214216232299805},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7891334295272827},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7261193990707397},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6243650913238525},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5754610300064087},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5547010898590088},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4823829233646393},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.4749719500541687},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4449310004711151},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4363236725330353},{"id":"https://openalex.org/C207363949","wikidata":"https://www.wikidata.org/wiki/Q462915","display_name":"Visual space","level":3,"score":0.43398404121398926},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.41474050283432007},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3242563009262085},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.32126384973526},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/besc57393.2022.9995148","is_oa":false,"landing_page_url":"https://doi.org/10.1109/besc57393.2022.9995148","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 9th International Conference on Behavioural and Social Computing (BESC)","raw_type":"proceedings-article"},{"id":"pmh:oai:figshare.com:article/22124498","is_oa":true,"landing_page_url":"https://figshare.com/articles/conference_contribution/Multi-dimensional_alignment_via_Variational_Autoencoders_for_Generalized_Zero-Shot_and_Few-Shot_Learning/22124498","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:figshare.com:article/22124498","is_oa":true,"landing_page_url":"https://figshare.com/articles/conference_contribution/Multi-dimensional_alignment_via_Variational_Autoencoders_for_Generalized_Zero-Shot_and_Few-Shot_Learning/22124498","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},"sustainable_development_goals":[{"score":0.7699999809265137,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1959608418","https://openalex.org/W2117539524","https://openalex.org/W2400717490","https://openalex.org/W2961408367","https://openalex.org/W2963283377","https://openalex.org/W2963499153","https://openalex.org/W2963960318","https://openalex.org/W2979571231","https://openalex.org/W3089741414","https://openalex.org/W3135727801","https://openalex.org/W3143107425","https://openalex.org/W3147476671","https://openalex.org/W4295521014","https://openalex.org/W6640963894","https://openalex.org/W6735913928","https://openalex.org/W6766206147"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W2074502265","https://openalex.org/W4214877189","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W2761785940","https://openalex.org/W156213964","https://openalex.org/W2050960118","https://openalex.org/W2129933262","https://openalex.org/W4390143830"],"abstract_inverted_index":{"Generalized":[0],"zero-shot":[1,183],"learning":[2],"(GZSL)":[3],"aims":[4],"to":[5,76,99,127,139,155],"solve":[6],"the":[7,15,56,60,64,68,72,78,81,89,114,121,133,144],"category":[8],"recognition":[9],"tasks":[10],"for":[11,52,110],"unseen":[12,25,137],"categories":[13,40],"under":[14,143],"setting":[16],"that":[17],"training":[18],"samples":[19],"only":[20],"contain":[21],"seen":[22,125],"classes":[23,26,62,70,109,126,138],"while":[24,87,131],"are":[27,36,96],"not":[28],"available.":[29],"This":[30],"research":[31],"is":[32],"vital":[33],"as":[34,184,186],"there":[35],"always":[37],"existing":[38],"new":[39],"and":[41,63,84,172],"large":[42],"amounts":[43],"of":[44,59,67,92,124,136,152],"unlabeled":[45],"data":[46],"in":[47,181],"realistic":[48],"scenarios.":[49],"Previous":[50],"work":[51],"GZSL":[53],"usually":[54],"maps":[55],"visual":[57,93,108,122],"information":[58,106,151],"visible":[61,83],"semantic":[65,134],"description":[66,135],"invisible":[69,85],"into":[71],"identical":[73],"embedding":[74,147],"space":[75,157],"bridge":[77],"gap":[79],"between":[80],"disjointed":[82],"classes,":[86],"ignoring":[88],"intrinsic":[90],"features":[91],"images,":[94],"which":[95],"sufficiently":[97],"discriminative":[98,105],"classify":[100],"themselves.":[101],"To":[102],"better":[103],"use":[104],"from":[107],"GZSL,":[111],"we":[112,119],"propose":[113],"n-CADA-VAE.":[115],"In":[116],"our":[117,177],"approach,":[118],"map":[120],"feature":[123],"a":[128,140],"high-dimensional":[129],"distribution":[130,142],"mapping":[132],"low-dimensional":[141],"same":[145],"latent":[146],"space,":[148],"thus":[149],"projecting":[150],"different":[153],"modalities":[154],"corresponding":[156],"positions":[158],"more":[159],"accurately.":[160],"We":[161],"conducted":[162],"extensive":[163],"experiments":[164],"on":[165],"four":[166],"benchmark":[167],"datasets":[168],"(CUB,":[169],"SUN,":[170],"AWA1,":[171],"AWA2).":[173],"The":[174],"results":[175],"show":[176],"model\u2019s":[178],"superior":[179],"performance":[180],"generalized":[182],"well":[185],"few-shot":[187],"learning.":[188]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
