{"id":"https://openalex.org/W4415538248","doi":"https://doi.org/10.1145/3746027.3755740","title":"PatAug: Augmentation of Augmentation for Test-Time Adaptation","display_name":"PatAug: Augmentation of Augmentation for Test-Time Adaptation","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415538248","doi":"https://doi.org/10.1145/3746027.3755740"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3755740","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755740","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101478197","display_name":"Xinyao Li","orcid":"https://orcid.org/0000-0002-5109-9966"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xinyao Li","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-5109-9966","affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004072001","display_name":"D Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dan Zhang","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0009-0003-9846-7775","affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003786587","display_name":"Zhekai Du","orcid":"https://orcid.org/0000-0002-9406-3920"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhekai Du","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-9406-3920","affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108048954","display_name":"Lei Zhu","orcid":"https://orcid.org/0000-0002-2993-7142"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Zhu","raw_affiliation_strings":["Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-2993-7142","affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100456835","display_name":"Zhi Chen","orcid":"https://orcid.org/0000-0002-9385-144X"},"institutions":[{"id":"https://openalex.org/I185523456","display_name":"University of Southern Queensland","ror":"https://ror.org/04sjbnx57","country_code":"AU","type":"education","lineage":["https://openalex.org/I185523456"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Zhi Chen","raw_affiliation_strings":["University of Southern Queensland, Toowoomba, Australia"],"raw_orcid":"https://orcid.org/0000-0002-9385-144X","affiliations":[{"raw_affiliation_string":"University of Southern Queensland, Toowoomba, Australia","institution_ids":["https://openalex.org/I185523456"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100338386","display_name":"Jingjing Li","orcid":"https://orcid.org/0000-0002-5504-2529"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Li","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-5504-2529","affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101478197"],"corresponding_institution_ids":["https://openalex.org/I150229711"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28745386,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5080","last_page":"5089"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9825999736785889,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9750000238418579,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.6523000001907349},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6211000084877014},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5763999819755554},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.45809999108314514},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.4431000053882599},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4027999937534332},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.3982999920845032}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6732000112533569},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.6523000001907349},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6211000084877014},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5806999802589417},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5763999819755554},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.45809999108314514},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.4431000053882599},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4027999937534332},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3986999988555908},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3982999920845032},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3034000098705292},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2558000087738037}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3755740","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755740","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8062367416","display_name":null,"funder_award_id":"52441801","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1977295328","https://openalex.org/W2047643928","https://openalex.org/W2108598243","https://openalex.org/W2138011018","https://openalex.org/W2155904486","https://openalex.org/W2533598788","https://openalex.org/W2627183927","https://openalex.org/W2887976372","https://openalex.org/W2954996726","https://openalex.org/W2962858109","https://openalex.org/W2964194231","https://openalex.org/W3037492894","https://openalex.org/W3177096435","https://openalex.org/W3198377975","https://openalex.org/W3198675127","https://openalex.org/W4312310776","https://openalex.org/W4313175608","https://openalex.org/W4382239347","https://openalex.org/W4394862623","https://openalex.org/W4400767051","https://openalex.org/W4402703115"],"related_works":[],"abstract_inverted_index":{"The":[0,103],"rich":[1],"pretrained":[2],"knowledge":[3],"in":[4,112,119],"vision-language":[5],"models":[6],"(VLMs)":[7],"endows":[8],"them":[9],"with":[10,163],"the":[11,76,115,120,133,157,181],"ability":[12],"to":[13,39,53,60,145],"discriminate":[14],"common":[15],"objects":[16],"given":[17,93],"only":[18,94],"category":[19,95],"names,":[20],"but":[21,57],"may":[22],"be":[23],"challenged":[24],"by":[25],"out-of-distribution":[26],"unlabeled":[27],"samples.":[28],"To":[29,154],"address":[30],"this":[31],"limitation,":[32],"test-time":[33],"adaptation":[34],"(TTA)":[35],"dynamically":[36],"adjusts":[37],"VLMs":[38,111],"target":[40,158],"distributions":[41],"during":[42],"inference.":[43],"Current":[44],"TTA":[45,151],"frameworks":[46],"rely":[47],"heavily":[48],"on":[49,114,174],"unsupervised":[50],"data":[51],"augmentations":[52,80],"enhance":[54],"sample":[55],"informativeness,":[56],"remain":[58],"vulnerable":[59],"naive":[61],"augmented":[62],"views.":[63],"This":[64],"work":[65],"introduces":[66],"Patch":[67],"Augmentation":[68],"(PatAug),":[69],"a":[70,164],"pixel-level":[71],"perturbation":[72],"framework":[73],"that":[74],"optimizes":[75],"benefits":[77],"of":[78,135,138,183],"informative":[79],"and":[81,169,176],"mitigates":[82],"negative":[83],"transformation":[84],"impacts.":[85],"Implemented":[86],"as":[87],"trainable":[88],"pixels,":[89],"PatAug":[90,142],"are":[91],"prepared":[92],"names":[96],"before":[97],"inference,":[98],"introducing":[99],"few":[100],"additional":[101],"overheads.":[102],"patches":[104,162],"encode":[105],"class-related":[106],"semantic":[107],"information.":[108,129],"They":[109],"assist":[110],"emphasizing":[113],"compatible":[116],"visual":[117],"information":[118],"images,":[121],"restoring":[122],"perturbed":[123],"image":[124],"details,":[125],"while":[126],"retaining":[127],"unrecognized":[128],"Such":[130],"merits":[131],"inspire":[132],"design":[134],"an":[136],"augmentation":[137,139,147],"framework,":[140],"where":[141],"is":[143],"applied":[144],"standard":[146],"views":[148],"for":[149],"reliable":[150],"inference":[152],"results.":[153],"better":[155],"fit":[156],"distributions,":[159],"we":[160],"adjust":[161],"cross-modal":[165],"similarity":[166],"alignment":[167],"loss":[168],"learnable":[170],"patching":[171],"weights.":[172],"Experiments":[173],"natural":[175],"specialized":[177],"domain":[178],"shifts":[179],"confirm":[180],"effectiveness":[182],"PatAug.":[184]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-25T00:00:00"}
