{"id":"https://openalex.org/W7140162767","doi":"https://doi.org/10.48550/arxiv.2603.21309","title":"Test-Time Adaptation via Cache Personalization for Facial Expression Recognition in Videos","display_name":"Test-Time Adaptation via Cache Personalization for Facial Expression Recognition in Videos","publication_year":2026,"publication_date":"2026-03-22","ids":{"openalex":"https://openalex.org/W7140162767","doi":"https://doi.org/10.48550/arxiv.2603.21309"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.21309","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.21309","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Sharafi, Masoumeh","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sharafi, Masoumeh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zeeshan, Muhammad Osama","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeeshan, Muhammad Osama","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Belharbi, Soufiane","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Belharbi, Soufiane","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Koerich, Alessandro Lameiras","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koerich, Alessandro Lameiras","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Pedersoli, Marco","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pedersoli, Marco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Granger, Eric","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Granger, Eric","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.8481000065803528,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.8481000065803528,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.025299999862909317,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.009100000374019146,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.8384000062942505},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.6862000226974487},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5999000072479248},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5806999802589417},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.4456999897956848},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.39430001378059387},{"id":"https://openalex.org/keywords/facial-expression-recognition","display_name":"Facial expression recognition","score":0.3824999928474426},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.3249000012874603}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8668000102043152},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.8384000062942505},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.6862000226974487},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5999000072479248},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5806999802589417},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.4456999897956848},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.39430001378059387},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38769999146461487},{"id":"https://openalex.org/C2987714656","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Facial expression recognition","level":4,"score":0.3824999928474426},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3257000148296356},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3249000012874603},{"id":"https://openalex.org/C201148951","wikidata":"https://www.wikidata.org/wiki/Q5015976","display_name":"Cache coloring","level":4,"score":0.3188999891281128},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C113166858","wikidata":"https://www.wikidata.org/wiki/Q5015981","display_name":"Cache pollution","level":5,"score":0.2962999939918518},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.2784000039100647},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.274399995803833},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2727000117301941},{"id":"https://openalex.org/C167713795","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"Smart Cache","level":5,"score":0.2619999945163727},{"id":"https://openalex.org/C136085584","wikidata":"https://www.wikidata.org/wiki/Q910289","display_name":"Overlay","level":2,"score":0.25609999895095825},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2547000050544739}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.21309","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.21309","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Facial":[0],"expression":[1],"recognition":[2],"(FER)":[3],"in":[4,65],"videos":[5],"requires":[6],"model":[7],"personalization":[8,85],"to":[9,22,111,148],"capture":[10],"the":[11,150,173],"considerable":[12],"variations":[13],"across":[14],"subjects.":[15],"Vision-language":[16],"models":[17,39],"(VLMs)":[18],"offer":[19],"strong":[20],"transfer":[21],"downstream":[23],"tasks":[24],"through":[25,73,180],"image-text":[26],"alignment,":[27],"but":[28],"their":[29],"performance":[30],"can":[31,45,105,208],"still":[32],"degrade":[33],"under":[34,213],"inter-subject":[35],"distribution":[36],"shifts.":[37],"Personalizing":[38],"using":[40],"test-time":[41],"adaptation":[42],"(TTA)":[43],"methods":[44,53,94,212],"mitigate":[46],"this":[47],"challenge.":[48],"However,":[49],"most":[50],"state-of-the-art":[51,210],"TTA":[52,72,79,93,211],"rely":[54,95],"on":[55,97,166,195],"unsupervised":[56],"parameter":[57],"optimization,":[58],"introducing":[59],"computational":[60,221],"overhead":[61,224],"that":[62,81,100,123,131,141,187,206],"is":[63],"impractical":[64],"many":[66],"real-world":[67,226],"applications.":[68],"This":[69],"paper":[70],"introduces":[71],"Cache":[74,155],"Personalization":[75],"(TTA-CaP),":[76],"a":[77,119,127,137,162],"cache-based":[78,92],"method":[80],"enables":[82],"cost-effective":[83],"(gradient-free)":[84],"of":[86,152,182],"VLMs":[87],"for":[88,225],"video":[89,198],"FER.":[90],"Prior":[91],"solely":[96],"dynamic":[98],"memories":[99],"store":[101],"test":[102],"samples,":[103,135],"which":[104],"accumulate":[106],"errors":[107],"and":[108,136,157,170,203,215,222],"drift":[109],"due":[110],"noisy":[112,153],"pseudo-labels.":[113,154],"TTA-CaP":[114,177,207],"leverages":[115],"three":[116,196],"coordinated":[117],"caches:":[118],"personalized":[120,174],"source":[121],"cache":[122,130,140],"stores":[124,142],"source-domain":[125],"prototypes,":[126],"positive":[128],"target":[129,139],"accumulates":[132],"reliable":[133],"subject-specific":[134,214],"negative":[138,146],"low-confidence":[143],"cases":[144],"as":[145],"samples":[147],"reduce":[149],"impact":[151],"updates":[156],"replacement":[158],"are":[159],"controlled":[160],"by":[161],"tri-gate":[163],"mechanism":[164],"based":[165],"temporal":[167],"stability,":[168],"confidence,":[169],"consistency":[171],"with":[172],"cache.":[175],"Finally,":[176],"refines":[178],"predictions":[179],"fusion":[181],"embeddings,":[183],"yielding":[184],"refined":[185],"representations":[186],"support":[188],"temporally":[189],"stable":[190],"video-level":[191],"predictions.":[192],"Our":[193],"experiments":[194],"challenging":[197],"FER":[199],"datasets,":[200],"BioVid,":[201],"StressID,":[202],"BAH,":[204],"indicate":[205],"outperform":[209],"environmental":[216],"shifts,":[217],"while":[218],"maintaining":[219],"low":[220],"memory":[223],"deployment.":[227]},"counts_by_year":[],"updated_date":"2026-04-25T08:17:42.794288","created_date":"2026-03-25T00:00:00"}
