{"id":"https://openalex.org/W4387682366","doi":"https://doi.org/10.1109/tcsvt.2023.3324648","title":"A Transferable Generative Framework for Multi-Label Zero-Shot Learning","display_name":"A Transferable Generative Framework for Multi-Label Zero-Shot Learning","publication_year":2023,"publication_date":"2023-10-16","ids":{"openalex":"https://openalex.org/W4387682366","doi":"https://doi.org/10.1109/tcsvt.2023.3324648"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3324648","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3324648","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072105606","display_name":"Peirong Ma","orcid":"https://orcid.org/0000-0001-6391-7527"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Peirong Ma","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101960599","display_name":"Zhiquan He","orcid":"https://orcid.org/0000-0002-6674-6003"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiquan He","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031121165","display_name":"Wu Ran","orcid":"https://orcid.org/0000-0001-8478-0750"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wu Ran","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070355771","display_name":"Hong Lu","orcid":"https://orcid.org/0000-0002-4572-2854"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Lu","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5072105606"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":1.5763,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.866571,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"34","issue":"5","first_page":"3409","last_page":"3423"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.974399983882904,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10515","display_name":"Cancer-related molecular mechanisms research","score":0.9648000001907349,"subfield":{"id":"https://openalex.org/subfields/1306","display_name":"Cancer Research"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6883785724639893},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6745659112930298},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6461962461471558},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5639045238494873},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5416219234466553},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4746152460575104},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.46477511525154114},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4619693160057068},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.45092886686325073},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.44184139370918274},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.417167603969574},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.3679402768611908}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6883785724639893},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6745659112930298},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6461962461471558},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5639045238494873},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5416219234466553},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4746152460575104},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.46477511525154114},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4619693160057068},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.45092886686325073},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.44184139370918274},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.417167603969574},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3679402768611908},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3324648","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3324648","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","display_name":"Life below water","score":0.7900000214576721}],"awards":[{"id":"https://openalex.org/G7143284523","display_name":null,"funder_award_id":"62072112","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":79,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1797268635","https://openalex.org/W1849277567","https://openalex.org/W1861492603","https://openalex.org/W2007972815","https://openalex.org/W2032699694","https://openalex.org/W2098411764","https://openalex.org/W2108598243","https://openalex.org/W2128532956","https://openalex.org/W2141350700","https://openalex.org/W2171061940","https://openalex.org/W2187089797","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2251771443","https://openalex.org/W2398118205","https://openalex.org/W2413850928","https://openalex.org/W2552383788","https://openalex.org/W2577784528","https://openalex.org/W2924476266","https://openalex.org/W2932399282","https://openalex.org/W2949952652","https://openalex.org/W2963052338","https://openalex.org/W2963499153","https://openalex.org/W2964105864","https://openalex.org/W2979571231","https://openalex.org/W2997998901","https://openalex.org/W2998124234","https://openalex.org/W2998420437","https://openalex.org/W3003930651","https://openalex.org/W3014645216","https://openalex.org/W3034978279","https://openalex.org/W3104069527","https://openalex.org/W3109283569","https://openalex.org/W3109728025","https://openalex.org/W3136203352","https://openalex.org/W3163811911","https://openalex.org/W3165181705","https://openalex.org/W3171926364","https://openalex.org/W3192931333","https://openalex.org/W3202858701","https://openalex.org/W3203055845","https://openalex.org/W3210749271","https://openalex.org/W3211407538","https://openalex.org/W4214673031","https://openalex.org/W4229044990","https://openalex.org/W4229482837","https://openalex.org/W4281780077","https://openalex.org/W4293518071","https://openalex.org/W4294170691","https://openalex.org/W4295788787","https://openalex.org/W4296708598","https://openalex.org/W4296739197","https://openalex.org/W4310418568","https://openalex.org/W4311415873","https://openalex.org/W4312458986","https://openalex.org/W4312559104","https://openalex.org/W4312563428","https://openalex.org/W4312747482","https://openalex.org/W4312773012","https://openalex.org/W4318953229","https://openalex.org/W4319778743","https://openalex.org/W4382450414","https://openalex.org/W4384306363","https://openalex.org/W4386075561","https://openalex.org/W4386415485","https://openalex.org/W6603820874","https://openalex.org/W6621740533","https://openalex.org/W6636510571","https://openalex.org/W6637373629","https://openalex.org/W6638319203","https://openalex.org/W6678470764","https://openalex.org/W6678800043","https://openalex.org/W6735913928","https://openalex.org/W6752083267","https://openalex.org/W6789387562","https://openalex.org/W6791353385","https://openalex.org/W6845373907","https://openalex.org/W6846835116"],"related_works":["https://openalex.org/W4396941953","https://openalex.org/W2093104230","https://openalex.org/W2987280934","https://openalex.org/W4390874210","https://openalex.org/W4384918963","https://openalex.org/W4365211920","https://openalex.org/W2128027845","https://openalex.org/W3014948380","https://openalex.org/W4386184937","https://openalex.org/W4394728283"],"abstract_inverted_index":{"Multi-label":[0],"zero-shot":[1,13],"learning":[2,14],"(MLZSL)":[3],"is":[4],"a":[5,24,48,56,62,70,108,143],"more":[6,120],"realistic":[7],"and":[8,35,69,119,130,138,188,195],"challenging":[9],"task":[10,34,182],"than":[11],"single-label":[12,112],"(SLZSL),":[15],"which":[16,53],"aims":[17],"to":[18,31,85,133],"recognize":[19,37,135],"multiple":[20,38],"unseen":[21,39],"classes":[22,92],"in":[23,42,142],"single":[25],"image.":[26],"To":[27],"adapt":[28],"generative":[29,165],"models":[30],"the":[32,80,98,136,162,176,179],"MLZSL":[33,166],"better":[36,134],"object":[40,140],"categories":[41,141],"an":[43],"image,":[44,145],"this":[45],"paper":[46],"proposes":[47],"Transferable":[49],"Generative":[50],"Framework":[51],"(TGF),":[52],"consists":[54],"of":[55,91,178],"Multi-Label":[57,64,71],"Semantic":[58],"Embedding":[59],"Autoencoders":[60],"(SEAs),":[61],"Semantic-Related":[63],"Feature":[65,72],"Transformation":[66],"Network":[67],"(FTN)":[68],"Generation":[73],"Networks":[74],"(FGNs).":[75],"First,":[76],"SEAs":[77],"adaptively":[78],"encodes":[79],"class-level":[81],"word":[82],"vectors":[83],"corresponding":[84],"each":[86],"sample":[87],"containing":[88],"different":[89],"number":[90],"into":[93,114],"sample-level":[94],"semantic":[95],"embeddings":[96],"with":[97,161],"same":[99],"dimension.":[100],"Then,":[101],"FTN":[102],"transforms":[103],"global":[104,129],"features":[105,115,132],"extracted":[106],"by":[107,183],"CNN":[109],"pre-trained":[110],"on":[111,149,191],"images":[113],"that":[116,154],"are":[117],"semantic-related":[118],"suitable":[121],"for":[122],"multi-label":[123,144],"classification.":[124],"Finally,":[125],"FGNs":[126],"generates":[127],"both":[128],"local":[131],"dominant":[137],"minor":[139],"respectively.":[146,198],"Extensive":[147],"experiments":[148],"three":[150],"benchmark":[151],"datasets":[152],"show":[153],"TGF":[155,174],"significantly":[156],"outperforms":[157],"state-of-the-arts.":[158],"Specifically,":[159],"compared":[160],"previous":[163],"best":[164],"method":[167],"(":[168],"<italic":[169],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[170],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">i.e</i>":[171],".,":[172],"Gen-MLZSL),":[173],"improves":[175],"mAP":[177],"ZSL":[180],"(GZSL)":[181],"5.4%":[184],"(6.9%),":[185],"20.5%":[186],"(27.9%),":[187],"2.4%":[189],"(3.9%)":[190],"NUS-WIDE,":[192],"Open":[193],"Images,":[194],"MS-COCO":[196],"datasets,":[197]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
