{"id":"https://openalex.org/W7154950357","doi":"https://doi.org/10.48550/arxiv.2604.15756","title":"TTL: Test-time Textual Learning for OOD Detection with Pretrained Vision-Language Models","display_name":"TTL: Test-time Textual Learning for OOD Detection with Pretrained Vision-Language Models","publication_year":2026,"publication_date":"2026-04-17","ids":{"openalex":"https://openalex.org/W7154950357","doi":"https://doi.org/10.48550/arxiv.2604.15756"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.15756","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15756","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.15756","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134033027","display_name":"Jinlun Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Jinlun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054505343","display_name":"\u5ed6\u6c5f","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liao, Jiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123458700","display_name":"Runhe Lai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lai, Runhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123494937","display_name":"Xinhua Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Xinhua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134071302","display_name":"Jiaxin Zhuang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhuang, Jiaxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056718604","display_name":"Zhiyong Gan","orcid":"https://orcid.org/0009-0008-6451-1068"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gan, Zhiyong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134080526","display_name":"Ruixuan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ruixuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8292999863624573,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8292999863624573,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.09730000048875809,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.011699999682605267,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6552000045776367},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.510200023651123},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4172999858856201},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.39469999074935913},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.37529999017715454},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.3508000075817108}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7785000205039978},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6552000045776367},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5720999836921692},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.510200023651123},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44679999351501465},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4172999858856201},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.39469999074935913},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.37529999017715454},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.3508000075817108},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34369999170303345},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3264999985694885},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2987000048160553},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2847000062465668},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.27410000562667847},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.26269999146461487}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.15756","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15756","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.15756","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15756","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.641440212726593,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision-language":[0],"models":[1],"(VLMs)":[2],"such":[3,33],"as":[4],"CLIP":[5],"exhibit":[6],"strong":[7],"Out-of-distribution":[8],"(OOD)":[9],"detection":[10,25],"capabilities":[11],"by":[12,27,109],"aligning":[13],"visual":[14],"and":[15,37,56],"textual":[16,80,140,169],"representations.":[17],"Recent":[18],"CLIP-based":[19],"test-time":[20,173],"adaptation":[21,124,170],"methods":[22],"further":[23],"improve":[24],"performance":[26],"incorporating":[28],"external":[29,89],"OOD":[30,42,58,79,90,103,114,121,133,156,174],"labels.":[31,91],"However,":[32],"labels":[34,50],"are":[35],"finite":[36],"fixed,":[38],"while":[39,125],"the":[40,54,166],"real":[41],"semantic":[43],"space":[44],"is":[45,178],"inherently":[46],"open-ended.":[47],"Consequently,":[48],"fixed":[49],"fail":[51],"to":[52,100],"represent":[53],"diverse":[55],"evolving":[57],"semantics":[59,81],"encountered":[60],"in":[61],"test":[62,84,98],"streams.":[63],"To":[64,105],"address":[65],"this":[66],"limitation,":[67],"we":[68,111],"introduce":[69,112],"Test-time":[70],"Textual":[71,134],"Learning":[72],"(TTL),":[73],"a":[74],"framework":[75],"that":[76,118,137,159],"dynamically":[77],"learns":[78],"from":[82],"unlabeled":[83],"streams,":[85],"without":[86],"relying":[87],"on":[88,150],"TTL":[92,130,160],"updates":[93],"learnable":[94],"prompts":[95],"using":[96],"pseudo-labeled":[97],"samples":[99,122],"capture":[101],"emerging":[102],"knowledge.":[104],"suppress":[106],"noise":[107],"introduced":[108],"pseudo-labels,":[110],"an":[113,132],"knowledge":[115],"purification":[116],"strategy":[117],"selects":[119],"reliable":[120],"for":[123,171],"suppressing":[126],"noise.":[127],"In":[128],"addition,":[129],"maintains":[131],"Knowledge":[135],"Bank":[136],"stores":[138],"high-quality":[139],"features,":[141],"providing":[142],"stable":[143],"score":[144],"calibration":[145],"across":[146],"batches.":[147],"Extensive":[148],"experiments":[149],"two":[151],"standard":[152],"benchmarks":[153],"with":[154],"nine":[155],"datasets":[157],"demonstrate":[158],"consistently":[161],"achieves":[162],"state-of-the-art":[163],"performance,":[164],"highlighting":[165],"value":[167],"of":[168],"robust":[172],"detection.":[175],"Our":[176],"code":[177],"available":[179],"at":[180],"https://github.com/figec/TTL.":[181]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-21T00:00:00"}
