{"id":"https://openalex.org/W4386755382","doi":"https://doi.org/10.48550/arxiv.2309.06809","title":"TAP: Targeted Prompting for Task Adaptive Generation of Textual Training Instances for Visual Classification","display_name":"TAP: Targeted Prompting for Task Adaptive Generation of Textual Training Instances for Visual Classification","publication_year":2023,"publication_date":"2023-09-13","ids":{"openalex":"https://openalex.org/W4386755382","doi":"https://doi.org/10.48550/arxiv.2309.06809"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2309.06809","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.06809","pdf_url":"https://arxiv.org/pdf/2309.06809","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2309.06809","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113181018","display_name":"M. Jehanzeb Mirza","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mirza, M. Jehanzeb","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020676344","display_name":"Leonid Karlinsky","orcid":"https://orcid.org/0000-0003-2524-2068"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karlinsky, Leonid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008915926","display_name":"Wei Lin","orcid":"https://orcid.org/0000-0003-1597-0993"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039382695","display_name":"Horst Possegger","orcid":"https://orcid.org/0000-0002-5427-9938"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Possegger, Horst","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052325109","display_name":"Rog\u00e9rio Feris","orcid":"https://orcid.org/0000-0001-6399-0679"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feris, Rogerio","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5011359067","display_name":"Horst Bischof","orcid":"https://orcid.org/0000-0002-9096-6671"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bischof, Horst","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5113181018"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9760000109672546,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7766404747962952},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7180903553962708},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5991157293319702},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5767172574996948},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.5685961842536926},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5383682250976562},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5163372755050659},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47984620928764343},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.4684128165245056},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.46641620993614197},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4278465211391449},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4272312521934509},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.41733318567276},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3604575991630554},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.14277425408363342},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08105558156967163}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7766404747962952},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7180903553962708},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5991157293319702},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5767172574996948},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.5685961842536926},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5383682250976562},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5163372755050659},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47984620928764343},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.4684128165245056},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.46641620993614197},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4278465211391449},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4272312521934509},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.41733318567276},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3604575991630554},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.14277425408363342},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08105558156967163},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2309.06809","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.06809","pdf_url":"https://arxiv.org/pdf/2309.06809","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2309.06809","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2309.06809","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2309.06809","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.06809","pdf_url":"https://arxiv.org/pdf/2309.06809","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.800000011920929}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4386755382.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3035557009","https://openalex.org/W3204418343","https://openalex.org/W2341113105","https://openalex.org/W2955172689","https://openalex.org/W3132602785","https://openalex.org/W3046182208","https://openalex.org/W2343346879","https://openalex.org/W2186589590","https://openalex.org/W2531741693","https://openalex.org/W4297818280"],"abstract_inverted_index":{"Vision":[0],"and":[1,74,107,159],"Language":[2,91],"Models":[3,92],"(VLMs),":[4],"such":[5],"as":[6],"CLIP,":[7],"have":[8],"enabled":[9],"visual":[10,27,81],"recognition":[11,28,82],"of":[12,17,41,119],"a":[13],"potentially":[14],"unlimited":[15],"set":[16],"categories":[18],"described":[19],"by":[20,89],"text":[21,127],"prompts.":[22],"However,":[23],"for":[24],"the":[25,38,42,49,53,117,120,135],"best":[26],"performance,":[29],"these":[30],"models":[31],"still":[32],"require":[33],"tuning":[34],"to":[35,47,66,77,134,144,153,168],"better":[36],"fit":[37],"data":[39,87,128],"distributions":[40],"downstream":[43,121],"tasks,":[44],"in":[45,75,148,156,164],"order":[46],"overcome":[48],"domain":[50],"shift":[51],"from":[52,129],"web-based":[54],"pre-training":[55],"data.":[56],"Recently,":[57],"it":[58,63,110],"has":[59],"been":[60],"shown":[61],"that":[62],"is":[64],"possible":[65],"effectively":[67,78],"tune":[68],"VLMs":[69,80],"without":[70],"any":[71],"paired":[72],"data,":[73],"particular":[76],"improve":[79],"performance":[83,146],"using":[84],"text-only":[85,103,137],"training":[86,105,139],"generated":[88],"Large":[90],"(LLMs).":[93],"In":[94,131],"this":[95,101],"paper,":[96],"we":[97,141],"dive":[98],"deeper":[99],"into":[100,123],"exciting":[102],"VLM":[104,138],"approach":[106],"explore":[108],"ways":[109],"can":[111],"be":[112],"significantly":[113],"further":[114],"improved":[115],"taking":[116],"specifics":[118],"task":[122],"account":[124],"when":[125],"sampling":[126],"LLMs.":[130],"particular,":[132],"compared":[133,167],"SOTA":[136],"approach,":[140],"demonstrate":[142],"up":[143,152],"8.4%":[145],"improvement":[147,155,163],"(cross)":[149],"domain-specific":[150],"adaptation,":[151],"8.7%":[154],"fine-grained":[157],"recognition,":[158],"3.1%":[160],"overall":[161],"average":[162],"zero-shot":[165],"classification":[166],"strong":[169],"baselines.":[170]},"counts_by_year":[],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2023-09-15T00:00:00"}
