{"id":"https://openalex.org/W4404238284","doi":"https://doi.org/10.1109/tcsvt.2024.3495533","title":"Variational Feature Imitation Conditioned on Visual Descriptions for Few-Shot Fine-Grained Recognition","display_name":"Variational Feature Imitation Conditioned on Visual Descriptions for Few-Shot Fine-Grained Recognition","publication_year":2024,"publication_date":"2024-11-11","ids":{"openalex":"https://openalex.org/W4404238284","doi":"https://doi.org/10.1109/tcsvt.2024.3495533"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3495533","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3495533","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100708142","display_name":"Xin Lu","orcid":"https://orcid.org/0009-0005-7669-1674"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Lu","raw_affiliation_strings":["School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0005-7669-1674","affiliations":[{"raw_affiliation_string":"School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yixuan Pan","orcid":"https://orcid.org/0009-0005-6517-9739"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixuan Pan","raw_affiliation_strings":["School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0005-6517-9739","affiliations":[{"raw_affiliation_string":"School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090784541","display_name":"Yichao Cao","orcid":"https://orcid.org/0000-0003-2997-4012"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yichao Cao","raw_affiliation_strings":["School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0003-2997-4012","affiliations":[{"raw_affiliation_string":"School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xin Zhou","orcid":"https://orcid.org/0009-0006-5525-435X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xin Zhou","raw_affiliation_strings":["Nanjing Enbo Technology Company Ltd., Nanjing, China","Nanjing Enbo Technology Co., Ltd, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0006-5525-435X","affiliations":[{"raw_affiliation_string":"Nanjing Enbo Technology Company Ltd., Nanjing, China","institution_ids":[]},{"raw_affiliation_string":"Nanjing Enbo Technology Co., Ltd, Nanjing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066658319","display_name":"Xiaobo Lu","orcid":"https://orcid.org/0000-0002-7707-7538"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaobo Lu","raw_affiliation_strings":["School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-7707-7538","affiliations":[{"raw_affiliation_string":"School of Automation and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"Southeast University and the Key Laboratory of Measurement and Control of Complex Systems of Engineering, Ministry of Education, School of Automation, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100708142"],"corresponding_institution_ids":["https://openalex.org/I76569877"],"apc_list":null,"apc_paid":null,"fwci":0.2381,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54205322,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"35","issue":"3","first_page":"2215","last_page":"2229"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9824000000953674,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9559000134468079,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.680305004119873},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6279106736183167},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.606797456741333},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5736072659492493},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.5207369327545166},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5128567218780518},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.46316492557525635},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.45385512709617615},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.41966909170150757},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.09059077501296997}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.680305004119873},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6279106736183167},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.606797456741333},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5736072659492493},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.5207369327545166},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5128567218780518},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.46316492557525635},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.45385512709617615},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.41966909170150757},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09059077501296997},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3495533","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3495533","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2590141440","display_name":null,"funder_award_id":"62271143","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334059","display_name":"Research Computing Center, University of Chicago","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":79,"referenced_works":["https://openalex.org/W2138011018","https://openalex.org/W2167344194","https://openalex.org/W2752782242","https://openalex.org/W2797977484","https://openalex.org/W2904347197","https://openalex.org/W2928798948","https://openalex.org/W2957105406","https://openalex.org/W2959289524","https://openalex.org/W2963070905","https://openalex.org/W2963101867","https://openalex.org/W2963283377","https://openalex.org/W2963857746","https://openalex.org/W2964105864","https://openalex.org/W2965572487","https://openalex.org/W2979689312","https://openalex.org/W2981707695","https://openalex.org/W2982806777","https://openalex.org/W2991559096","https://openalex.org/W3006462480","https://openalex.org/W3009864380","https://openalex.org/W3022210053","https://openalex.org/W3025784200","https://openalex.org/W3034552520","https://openalex.org/W3034978645","https://openalex.org/W3046698617","https://openalex.org/W3092900959","https://openalex.org/W3107763055","https://openalex.org/W3137257446","https://openalex.org/W3157122767","https://openalex.org/W3165405144","https://openalex.org/W3176341011","https://openalex.org/W3198377975","https://openalex.org/W3201987584","https://openalex.org/W3213192039","https://openalex.org/W4280538209","https://openalex.org/W4283802957","https://openalex.org/W4287180559","https://openalex.org/W4289752563","https://openalex.org/W4304098587","https://openalex.org/W4311415873","https://openalex.org/W4312500832","https://openalex.org/W4312651322","https://openalex.org/W4312792327","https://openalex.org/W4313855822","https://openalex.org/W4316660800","https://openalex.org/W4320005661","https://openalex.org/W4321608200","https://openalex.org/W4376464610","https://openalex.org/W4382462216","https://openalex.org/W4385565405","https://openalex.org/W4386076063","https://openalex.org/W4386790226","https://openalex.org/W4387968000","https://openalex.org/W4387969056","https://openalex.org/W4390562736","https://openalex.org/W4390873185","https://openalex.org/W4390874575","https://openalex.org/W4392152061","https://openalex.org/W4392208008","https://openalex.org/W4393148571","https://openalex.org/W4394015587","https://openalex.org/W6638319203","https://openalex.org/W6687045409","https://openalex.org/W6736057607","https://openalex.org/W6744627333","https://openalex.org/W6751959828","https://openalex.org/W6767471572","https://openalex.org/W6780975210","https://openalex.org/W6790019176","https://openalex.org/W6790978476","https://openalex.org/W6791353385","https://openalex.org/W6798805250","https://openalex.org/W6810334672","https://openalex.org/W6811013733","https://openalex.org/W6838865580","https://openalex.org/W6849177959","https://openalex.org/W6853242345","https://openalex.org/W6857487352","https://openalex.org/W6861415825"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W2074502265"],"abstract_inverted_index":{"In":[0,165],"few-shot":[1,77],"fine-grained":[2,78,190],"recognition":[3,79,223],"(FS-FGR)":[4],"tasks,":[5],"the":[6,46,52,56,69,72,101,110,119,143,158,166,169,176,195,204,220],"main":[7],"challenge":[8],"is":[9,153,172,231],"to":[10,35,45,63,156],"distinguish":[11],"novel":[12],"categories":[13,125],"with":[14,81],"high":[15],"intra-class":[16,120,146],"variations":[17,121],"and":[18,67,109,182,225],"low":[19],"inter-class":[20],"differences":[21],"given":[22],"scarce":[23],"training":[24],"data.":[25],"Existing":[26],"studies":[27],"explore":[28],"discriminative":[29],"features":[30,136],"through":[31,162,175],"a":[32,105,115,129,148,215],"compact":[33,73],"network":[34],"avoid":[36],"overfitting,":[37],"while":[38],"they":[39],"achieve":[40],"marginal":[41],"performance":[42,70],"gain":[43],"owing":[44],"limited":[47],"representation":[48],"capability.":[49],"Motivated":[50],"by":[51,114,137,214],"significant":[53],"progress":[54],"of":[55,71,145,179],"vision":[57,106],"foundation":[58,107],"model,":[59],"we":[60,133],"introduce":[61],"it":[62],"describe":[64],"visual":[65,180],"attributes":[66],"boost":[68],"feature":[74,116,163],"extractor.":[75,117],"A":[76],"method":[80],"Variational":[82],"Feature":[83],"Imitation":[84],"Conditioned":[85],"on":[86,188,208],"Visual":[87],"Descriptions,":[88],"VFI-CVD":[89,197],"for":[90],"short,":[91],"has":[92],"been":[93],"proposed":[94,196],"in":[95,219],"this":[96],"paper.":[97],"It":[98,210],"simultaneously":[99],"exploits":[100],"pre-trained":[102],"knowledge":[103,112,159,171],"from":[104],"model":[108],"expert":[111],"mined":[113],"Specifically,":[118],"shared":[122],"across":[123],"object":[124],"are":[126],"encoded":[127],"into":[128],"common":[130],"distribution":[131],"thus":[132],"can":[134],"augment":[135],"sampling":[138],"latent":[139],"variables.":[140],"To":[141],"enhance":[142],"learning":[144],"variations,":[147],"condition":[149],"exchange":[150],"strategy":[151],"(CES)":[152],"put":[154],"forward":[155],"interact":[157],"between":[160],"samples":[161],"cross-imitation.":[164],"inference":[167],"stage,":[168],"learned":[170],"further":[173],"integrated":[174],"joint":[177],"prediction":[178],"descriptions":[181],"cross-imitated":[183],"features.":[184],"Comprehensive":[185],"experimental":[186],"results":[187],"four":[189],"benchmark":[191],"datasets":[192],"show":[193],"that":[194],"achieves":[198],"state-of-the-art":[199],"performance,":[200],"e.g.,":[201],"90.37%":[202],"under":[203],"5-way":[205],"1-shot":[206],"setting":[207],"CUB-200-2011.":[209],"surpasses":[211],"existing":[212],"methods":[213],"large":[216],"margin,":[217],"especially":[218],"challenging":[221],"30-way":[222],"tasks":[224],"cross-domain":[226],"evaluation.":[227],"The":[228],"source":[229],"code":[230],"publicly":[232],"available:":[233],"<uri":[234],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[235],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/Lx-zjwf/VFI-CVD</uri>.":[236]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
