{"id":"https://openalex.org/W4312496169","doi":"https://doi.org/10.1109/icpr56361.2022.9956303","title":"When Few-Shot Learning Meets Video Object Detection","display_name":"When Few-Shot Learning Meets Video Object Detection","publication_year":2022,"publication_date":"2022-08-21","ids":{"openalex":"https://openalex.org/W4312496169","doi":"https://doi.org/10.1109/icpr56361.2022.9956303"},"language":"en","primary_location":{"id":"doi:10.1109/icpr56361.2022.9956303","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr56361.2022.9956303","pdf_url":null,"source":{"id":"https://openalex.org/S4363607731","display_name":"2022 26th International Conference on Pattern Recognition (ICPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 26th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109589429","display_name":"Zhongjie Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhongjie Yu","raw_affiliation_strings":["Wyze Labs, Inc","University of Wisconsin, USA"],"affiliations":[{"raw_affiliation_string":"Wyze Labs, Inc","institution_ids":[]},{"raw_affiliation_string":"University of Wisconsin, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089410490","display_name":"Gaoang Wang","orcid":"https://orcid.org/0000-0002-8403-1538"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaoang Wang","raw_affiliation_strings":["Zhejiang University,China","Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100443680","display_name":"Lin Chen","orcid":"https://orcid.org/0000-0001-6426-6682"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin Chen","raw_affiliation_strings":["Wyze Labs, Inc"],"affiliations":[{"raw_affiliation_string":"Wyze Labs, Inc","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053156269","display_name":"Sebastian Raschka","orcid":"https://orcid.org/0000-0001-6989-4493"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sebastian Raschka","raw_affiliation_strings":["University of Wisconsin,USA","University of Wisconsin, USA"],"affiliations":[{"raw_affiliation_string":"University of Wisconsin,USA","institution_ids":[]},{"raw_affiliation_string":"University of Wisconsin, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055469774","display_name":"Jiebo Luo","orcid":"https://orcid.org/0000-0002-4516-9729"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiebo Luo","raw_affiliation_strings":["University of Rochester,USA","University of Rochester, USA"],"affiliations":[{"raw_affiliation_string":"University of Rochester,USA","institution_ids":["https://openalex.org/I5388228"]},{"raw_affiliation_string":"University of Rochester, USA","institution_ids":["https://openalex.org/I5388228"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5109589429"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14921353,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2986","last_page":"2992"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8488845229148865},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.8229213356971741},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7730275392532349},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7692145109176636},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7133975028991699},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.5791568160057068},{"id":"https://openalex.org/keywords/clips","display_name":"CLIPS","score":0.571998655796051},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5719634294509888},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.5428573489189148},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5196734070777893},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4730837941169739},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.4709162414073944},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4482573866844177},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.43879836797714233},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4382953643798828},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3512919545173645},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.16738766431808472},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.15965041518211365}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8488845229148865},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.8229213356971741},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7730275392532349},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7692145109176636},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7133975028991699},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.5791568160057068},{"id":"https://openalex.org/C2778739407","wikidata":"https://www.wikidata.org/wiki/Q165372","display_name":"CLIPS","level":2,"score":0.571998655796051},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5719634294509888},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.5428573489189148},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5196734070777893},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4730837941169739},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.4709162414073944},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4482573866844177},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.43879836797714233},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4382953643798828},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3512919545173645},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.16738766431808472},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.15965041518211365},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr56361.2022.9956303","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr56361.2022.9956303","pdf_url":null,"source":{"id":"https://openalex.org/S4363607731","display_name":"2022 26th International Conference on Pattern Recognition (ICPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 26th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2117539524","https://openalex.org/W2194775991","https://openalex.org/W2601450892","https://openalex.org/W2604763608","https://openalex.org/W2609575245","https://openalex.org/W2625674597","https://openalex.org/W2796346823","https://openalex.org/W2894873912","https://openalex.org/W2895671740","https://openalex.org/W2962837320","https://openalex.org/W2963341924","https://openalex.org/W2963741406","https://openalex.org/W2964086649","https://openalex.org/W2964105864","https://openalex.org/W2964112702","https://openalex.org/W2964286567","https://openalex.org/W2979689312","https://openalex.org/W2983156430","https://openalex.org/W2990578161","https://openalex.org/W2994810768","https://openalex.org/W2996583130","https://openalex.org/W3010594275","https://openalex.org/W3034453888","https://openalex.org/W3034467781","https://openalex.org/W3034858314","https://openalex.org/W3034974675","https://openalex.org/W3035374961","https://openalex.org/W3035513921","https://openalex.org/W3088715381","https://openalex.org/W3101227480","https://openalex.org/W4294646197","https://openalex.org/W6620707391","https://openalex.org/W6717697761","https://openalex.org/W6735236233","https://openalex.org/W6736057607","https://openalex.org/W6750254146","https://openalex.org/W6753311412","https://openalex.org/W6755127997","https://openalex.org/W6755766585","https://openalex.org/W6758126075","https://openalex.org/W6774983715","https://openalex.org/W6782868315"],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W2901505109","https://openalex.org/W2940082708","https://openalex.org/W4292829955","https://openalex.org/W2287881387","https://openalex.org/W4298299496","https://openalex.org/W2609618931","https://openalex.org/W2988815316","https://openalex.org/W3082619268","https://openalex.org/W4390755799"],"abstract_inverted_index":{"Different":[0],"from":[1,57,73,113],"static":[2],"images,":[3],"videos":[4,25],"contain":[5],"additional":[6],"temporal":[7],"and":[8,101,139,158,164,171,190],"spatial":[9],"information":[10],"for":[11,33,91,107],"better":[12],"object":[13,71,93,110,130,216],"detection.":[14,94],"However,":[15],"it":[16],"is":[17,181],"costly":[18],"to":[19,42,61,66,125,184],"obtain":[20],"a":[21,49,69,75,103,122,133,140],"large":[22,134],"number":[23,135],"of":[24,88,136,144,151,207],"with":[26,201],"bounding":[27],"box":[28],"annotations":[29],"that":[30],"are":[31],"required":[32],"supervised":[34],"deep":[35,53],"learning.":[36],"Although":[37],"humans":[38],"can":[39],"easily":[40],"learn":[41,68],"recognize":[43],"new":[44,86,104,213],"objects":[45,138],"by":[46],"watching":[47],"only":[48,74],"few":[50,76,141],"video":[51,70,78,92,109,129,142,215],"clips,":[52],"learning":[54,90],"usually":[55],"suffers":[56],"overfitting.":[58],"This":[59],"leads":[60],"an":[62],"important":[63],"question:":[64],"how":[65],"effectively":[67,126],"detector":[72,131],"labeled":[77],"clips?":[79],"In":[80],"this":[81,155,212],"paper,":[82],"we":[83,168],"study":[84],"the":[85,98,114,128,149,187,205],"problem":[87],"few-shot":[89,99,108,214],"We":[95,120],"first":[96],"define":[97],"setting":[100],"create":[102],"benchmark":[105,199],"dataset":[106],"detection":[111,217],"derived":[112],"widely":[115],"used":[116],"ImageNet":[117],"VID":[118],"dataset.":[119],"employ":[121],"transfer-learning":[123],"framework":[124,156],"train":[127],"on":[132,160,196],"base-class":[137],"clips":[143],"novel-class":[145],"objects.":[146],"By":[147],"analyzing":[148],"results":[150],"two":[152,188],"methods":[153],"under":[154],"(Joint":[157],"Freeze)":[159],"our":[161,192,197,208],"designed":[162],"weak":[163],"strong":[165],"base":[166],"datasets,":[167],"reveal":[169],"insufficiency":[170],"overfitting":[172],"problems.":[173],"A":[174],"simple":[175],"but":[176],"effective":[177],"method,":[178],"called":[179],"Thaw,":[180],"naturally":[182],"developed":[183],"trade":[185],"off":[186],"problems":[189],"validate":[191],"analysis.":[193],"Extensive":[194],"experiments":[195],"proposed":[198],"datasets":[200],"different":[202],"scenarios":[203],"demonstrate":[204],"effectiveness":[206],"novel":[209],"analysis":[210],"in":[211],"problem.":[218]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
