{"id":"https://openalex.org/W4292794834","doi":"https://doi.org/10.1109/cvprw56347.2022.00422","title":"Continual Learning with Transformers for Image Classification","display_name":"Continual Learning with Transformers for Image Classification","publication_year":2022,"publication_date":"2022-06-01","ids":{"openalex":"https://openalex.org/W4292794834","doi":"https://doi.org/10.1109/cvprw56347.2022.00422"},"language":"en","primary_location":{"id":"doi:10.1109/cvprw56347.2022.00422","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvprw56347.2022.00422","pdf_url":null,"source":{"id":"https://openalex.org/S4363607748","display_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057377890","display_name":"Beyza Ermi\u015f","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Beyza Ermis","raw_affiliation_strings":["AWS,Berlin","AWS, Berlin"],"affiliations":[{"raw_affiliation_string":"AWS,Berlin","institution_ids":[]},{"raw_affiliation_string":"AWS, Berlin","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004208244","display_name":"Giovanni Zappella","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giovanni Zappella","raw_affiliation_strings":["AWS,Berlin","AWS, Berlin"],"affiliations":[{"raw_affiliation_string":"AWS,Berlin","institution_ids":[]},{"raw_affiliation_string":"AWS, Berlin","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002232506","display_name":"Martin Wistuba","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martin Wistuba","raw_affiliation_strings":["AWS,Berlin","AWS, Berlin"],"affiliations":[{"raw_affiliation_string":"AWS,Berlin","institution_ids":[]},{"raw_affiliation_string":"AWS, Berlin","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111881609","display_name":"Aditya Rawal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aditya Rawal","raw_affiliation_strings":["AWS,Santa Clara","AWS, Santa Clara"],"affiliations":[{"raw_affiliation_string":"AWS,Santa Clara","institution_ids":[]},{"raw_affiliation_string":"AWS, Santa Clara","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021107714","display_name":"C\u00e9dric Archambeau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cedric Archambeau","raw_affiliation_strings":["AWS,Berlin","AWS, Berlin"],"affiliations":[{"raw_affiliation_string":"AWS,Berlin","institution_ids":[]},{"raw_affiliation_string":"AWS, Berlin","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5057377890"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6621,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.86010558,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3773","last_page":"3780"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.972000002861023,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.816430389881134},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.799907386302948},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.643912672996521},{"id":"https://openalex.org/keywords/retraining","display_name":"Retraining","score":0.6412273645401001},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6388610005378723},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6073898077011108},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5929527282714844},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5614564418792725},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5130025744438171},{"id":"https://openalex.org/keywords/scratch","display_name":"Scratch","score":0.46968987584114075},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1181158721446991}],"concepts":[{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.816430389881134},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.799907386302948},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.643912672996521},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.6412273645401001},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6388610005378723},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6073898077011108},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5929527282714844},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5614564418792725},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5130025744438171},{"id":"https://openalex.org/C2781235140","wikidata":"https://www.wikidata.org/wiki/Q275131","display_name":"Scratch","level":2,"score":0.46968987584114075},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1181158721446991},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C155202549","wikidata":"https://www.wikidata.org/wiki/Q178803","display_name":"International trade","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvprw56347.2022.00422","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvprw56347.2022.00422","pdf_url":null,"source":{"id":"https://openalex.org/S4363607748","display_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6000000238418579}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1682403713","https://openalex.org/W2108598243","https://openalex.org/W2117539524","https://openalex.org/W2560647685","https://openalex.org/W2734314755","https://openalex.org/W2808439681","https://openalex.org/W2902456977","https://openalex.org/W2922466325","https://openalex.org/W2926477959","https://openalex.org/W2948734064","https://openalex.org/W2948743095","https://openalex.org/W2954929116","https://openalex.org/W2962945654","https://openalex.org/W2963438784","https://openalex.org/W2963540014","https://openalex.org/W2964189064","https://openalex.org/W2964303773","https://openalex.org/W2970200208","https://openalex.org/W2979826702","https://openalex.org/W2980994576","https://openalex.org/W3007522628","https://openalex.org/W3013325675","https://openalex.org/W3094502228","https://openalex.org/W3098170909","https://openalex.org/W3107810305","https://openalex.org/W3118608800","https://openalex.org/W3153675281","https://openalex.org/W3168403139","https://openalex.org/W3170874841","https://openalex.org/W3171057731","https://openalex.org/W3180392831","https://openalex.org/W4221164031","https://openalex.org/W4225484930","https://openalex.org/W4225871896","https://openalex.org/W4288336773","https://openalex.org/W4292779060","https://openalex.org/W4295883599","https://openalex.org/W4385245566","https://openalex.org/W6730146409","https://openalex.org/W6739901393","https://openalex.org/W6742852309","https://openalex.org/W6749495938","https://openalex.org/W6752530194","https://openalex.org/W6756754374","https://openalex.org/W6759579507","https://openalex.org/W6760883817","https://openalex.org/W6761469101","https://openalex.org/W6767674130","https://openalex.org/W6774108707","https://openalex.org/W6778883912","https://openalex.org/W6781568746","https://openalex.org/W6784333009","https://openalex.org/W6787972765","https://openalex.org/W6788135285","https://openalex.org/W6796390573","https://openalex.org/W6805023924","https://openalex.org/W6810241840","https://openalex.org/W6810653034"],"related_works":["https://openalex.org/W2475116013","https://openalex.org/W2770018148","https://openalex.org/W2358308169","https://openalex.org/W2385135707","https://openalex.org/W2140315382","https://openalex.org/W2059109728","https://openalex.org/W4206178588","https://openalex.org/W3094491777","https://openalex.org/W3214715529","https://openalex.org/W4287635093"],"abstract_inverted_index":{"In":[0,159],"many":[1],"real-world":[2],"scenarios,":[3],"data":[4,56],"to":[5,19,45,48,129,148,150,181,232],"train":[6],"machine":[7],"learning":[8,184],"models":[9,17],"become":[10],"available":[11,95],"over":[12,220],"time.":[13,222],"However,":[14],"neural":[15,73],"network":[16],"struggle":[18,147],"continually":[20],"learn":[21],"new":[22],"concepts":[23],"without":[24,156,209],"forgetting":[25,39,119],"what":[26],"has":[27],"been":[28],"learnt":[29],"in":[30,96,121,164],"the":[31,53,62,97,114,131,165,211,215,221,233],"past.":[32],"This":[33],"phenomenon":[34],"is":[35,42,80,179,225],"known":[36],"as":[37,52,76],"catastrophic":[38,118],"and":[40,83,136,188],"it":[41,224],"often":[43],"difficult":[44],"prevent":[46],"due":[47],"practical":[49],"constraints,":[50],"such":[51,75],"amount":[54,87],"of":[55,88,100,113,134,154,175,217],"that":[57,66,106,201],"can":[58,67,116],"be":[59,68,94],"stored":[60],"or":[61,213],"limited":[63],"computation":[64],"sources":[65],"used.":[69],"Moreover,":[70],"training":[71,89],"large":[72,152],"networks,":[74],"Transformers,":[77],"from":[78],"scratch":[79],"very":[81],"costly":[82],"requires":[84],"a":[85,144,151,169,205],"vast":[86],"data,":[90],"which":[91,178],"might":[92],"not":[93],"application":[98],"domain":[99,168],"interest.":[101],"A":[102],"recent":[103,170],"trend":[104],"indicates":[105],"dynamic":[107],"architectures":[108],"based":[109],"on":[110,190,197],"an":[111],"expansion":[112],"parameters":[115,135,219],"reduce":[117],"efficiently":[120],"continual":[122,183],"learning,":[123],"but":[124],"this":[125,160,202],"needs":[126],"complex":[127],"tuning":[128],"balance":[130],"growing":[132],"number":[133,153,216],"barely":[137],"share":[138],"any":[139],"information":[140],"across":[141],"tasks.":[142,193],"As":[143],"result,":[145],"they":[146],"scale":[149],"tasks":[155,200],"significant":[157],"overhead.":[158],"paper,":[161],"we":[162],"validate":[163],"computer":[166],"vision":[167],"solution":[171],"called":[172],"Adaptive":[173],"Distillation":[174],"Adapters":[176,189],"(ADA),":[177],"developed":[180],"perform":[182],"using":[185],"pre-trained":[186],"Transformers":[187],"text":[191],"classification":[192,199],"We":[194],"empirically":[195],"demonstrate":[196],"different":[198],"method":[203],"maintains":[204],"good":[206],"predictive":[207],"performance":[208],"retraining":[210],"model":[212,218],"increasing":[214],"Besides":[223],"significantly":[226],"faster":[227],"at":[228],"inference":[229],"time":[230],"compared":[231],"state-of-the-art":[234],"methods.":[235]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
