{"id":"https://openalex.org/W4286229627","doi":"https://doi.org/10.48550/arxiv.2207.08408","title":"STT: Soft Template Tuning for Few-Shot Adaptation","display_name":"STT: Soft Template Tuning for Few-Shot Adaptation","publication_year":2022,"publication_date":"2022-07-18","ids":{"openalex":"https://openalex.org/W4286229627","doi":"https://doi.org/10.48550/arxiv.2207.08408"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2207.08408","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.08408","pdf_url":"https://arxiv.org/pdf/2207.08408","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2207.08408","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100623508","display_name":"Ping Yu","orcid":"https://orcid.org/0000-0002-8913-873X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yu, Ping","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100391888","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0002-1568-2396"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107893340","display_name":"Chunyuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chunyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101424484","display_name":"Ruiyi Zhang","orcid":"https://orcid.org/0000-0002-4776-6762"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ruiyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044439388","display_name":"Zhanpeng Jin","orcid":"https://orcid.org/0000-0002-3020-3736"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Zhanpeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5114686221","display_name":"Changyou Chen","orcid":"https://orcid.org/0000-0002-9877-8448"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Changyou","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100623508"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.982200026512146,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8462517857551575},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.6351630091667175},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6264333128929138},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4902692139148712},{"id":"https://openalex.org/keywords/fine-tuning","display_name":"Fine-tuning","score":0.45497632026672363},{"id":"https://openalex.org/keywords/downstream","display_name":"Downstream (manufacturing)","score":0.45190587639808655},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4331277906894684},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.41429704427719116},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41138333082199097},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06639367341995239}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8462517857551575},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.6351630091667175},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6264333128929138},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4902692139148712},{"id":"https://openalex.org/C157524613","wikidata":"https://www.wikidata.org/wiki/Q2828883","display_name":"Fine-tuning","level":2,"score":0.45497632026672363},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.45190587639808655},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4331277906894684},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.41429704427719116},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41138333082199097},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06639367341995239},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2207.08408","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.08408","pdf_url":"https://arxiv.org/pdf/2207.08408","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2207.08408","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2207.08408","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2207.08408","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.08408","pdf_url":"https://arxiv.org/pdf/2207.08408","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4286229627.pdf","grobid_xml":"https://content.openalex.org/works/W4286229627.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2074502265","https://openalex.org/W4214877189","https://openalex.org/W2773965352","https://openalex.org/W2381179799","https://openalex.org/W2980279061","https://openalex.org/W2334685461","https://openalex.org/W1583765404","https://openalex.org/W2366718574","https://openalex.org/W2359774528","https://openalex.org/W4298312966"],"abstract_inverted_index":{"Prompt":[0],"tuning":[1,76,100],"has":[2],"been":[3],"an":[4],"extremely":[5],"effective":[6],"tool":[7],"to":[8,13,40],"adapt":[9],"a":[10,96,113,134],"pre-trained":[11],"model":[12],"downstream":[14,28,52,130],"tasks.":[15,29,173],"However,":[16],"standard":[17],"prompt-based":[18,153],"methods":[19,70,154],"mainly":[20],"consider":[21],"the":[22,35,41,59,64,67,109,148,164],"case":[23],"of":[24,27,61],"sufficient":[25],"data":[26,47,81],"It":[30],"is":[31,94],"still":[32,83,95],"unclear":[33],"whether":[34],"advantage":[36],"can":[37,146,161],"be":[38],"transferred":[39],"few-shot":[42,65,105],"regime,":[43],"where":[44],"only":[45],"limited":[46,80],"are":[48,82],"available":[49],"for":[50,104],"each":[51],"task.":[53,138],"Although":[54],"some":[55],"works":[56],"have":[57],"demonstrated":[58],"potential":[60],"prompt-tuning":[62,115],"under":[63],"setting,":[66],"main":[68],"stream":[69],"via":[71],"searching":[72],"discrete":[73],"prompts":[74,78],"or":[75],"soft":[77],"with":[79],"very":[84],"challenging.":[85],"Through":[86],"extensive":[87],"empirical":[88],"studies,":[89],"we":[90,111],"find":[91],"that":[92],"there":[93],"gap":[97,149],"between":[98,150],"prompt":[99],"and":[101,125,128,152,166],"fully":[102],"fine-tuning":[103,151,168],"learning.":[106],"To":[107],"bridge":[108],"gap,":[110],"propose":[112],"new":[114],"framework,":[116],"called":[117],"Soft":[118],"Template":[119],"Tuning":[120],"(STT).":[121],"STT":[122,145],"combines":[123],"manual":[124],"auto":[126],"prompts,":[127],"treats":[129],"classification":[131,172],"tasks":[132],"as":[133],"masked":[135],"language":[136],"modeling":[137],"Comprehensive":[139],"evaluation":[140],"on":[141,170],"different":[142],"settings":[143],"suggests":[144],"close":[147],"without":[155],"introducing":[156],"additional":[157],"parameters.":[158],"Significantly,":[159],"it":[160],"even":[162],"outperform":[163],"time-":[165],"resource-consuming":[167],"method":[169],"sentiment":[171]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
