{"id":"https://openalex.org/W4392182003","doi":"https://doi.org/10.48550/arxiv.2402.15017","title":"Towards Few-Shot Adaptation of Foundation Models via Multitask Finetuning","display_name":"Towards Few-Shot Adaptation of Foundation Models via Multitask Finetuning","publication_year":2024,"publication_date":"2024-02-22","ids":{"openalex":"https://openalex.org/W4392182003","doi":"https://doi.org/10.48550/arxiv.2402.15017"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.15017","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.15017","pdf_url":"https://arxiv.org/pdf/2402.15017","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.15017","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113127899","display_name":"Zhuoyan Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xu, Zhuoyan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069272192","display_name":"Zhenmei Shi","orcid":"https://orcid.org/0009-0007-6741-7598"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Zhenmei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101456098","display_name":"Junyi Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Junyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029753270","display_name":"Fangzhou Mu","orcid":"https://orcid.org/0000-0001-5580-2404"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Fangzhou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100451116","display_name":"Yin Li","orcid":"https://orcid.org/0000-0002-2635-6633"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100316775","display_name":"Yingyu Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Yingyu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5113127899"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12293","display_name":"Dam Engineering and Safety","score":0.9649999737739563,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12293","display_name":"Dam Engineering and Safety","score":0.9649999737739563,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.9455999732017517,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11046","display_name":"Geotechnical Engineering and Analysis","score":0.9304999709129333,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.629165768623352},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.6158130168914795},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4891569912433624},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.22759759426116943},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.17024368047714233},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.08062401413917542}],"concepts":[{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.629165768623352},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.6158130168914795},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4891569912433624},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.22759759426116943},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.17024368047714233},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.08062401413917542},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2402.15017","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.15017","pdf_url":"https://arxiv.org/pdf/2402.15017","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2402.15017","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.15017","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.15017","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.15017","pdf_url":"https://arxiv.org/pdf/2402.15017","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1567685964","display_name":"CAREER: Towards Better Understanding, Robustness, and Efficiency of Deep Learning","funder_award_id":"2046710","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4207694608","display_name":null,"funder_award_id":"CCF-2046710","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5632738584","display_name":null,"funder_award_id":"2023239","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6312673494","display_name":"Collaborative Research: RI: Small: Theoretical Foundations: TheAdvantage of Deep Learning over Traditional Shallow Learning Methods","funder_award_id":"2008559","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392182003.pdf","grobid_xml":"https://content.openalex.org/works/W4392182003.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2381393187","https://openalex.org/W2332779545","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2358060160","https://openalex.org/W2035483685","https://openalex.org/W1969764885","https://openalex.org/W2376932109","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Foundation":[0],"models":[1,182],"have":[2],"emerged":[3],"as":[4],"a":[5,49,53,62,88,132],"powerful":[6],"tool":[7],"for":[8],"many":[9],"AI":[10],"problems.":[11],"Despite":[12],"the":[13,74,102,110,116,163,177],"tremendous":[14],"success":[15,42],"of":[16,55,77,91,180],"foundation":[17,50,181],"models,":[18],"effective":[19,178],"adaptation":[20,60,179],"to":[21,61,98,107,162,183],"new":[22,174,184],"tasks,":[23,57,93,159],"particularly":[24],"those":[25],"with":[26,40,65,87,142],"limited":[27,66],"labels,":[28],"remains":[29],"an":[30],"open":[31],"question":[32],"and":[33,45,121,126,129],"lacks":[34],"theoretical":[35,75,83,140],"understanding.":[36],"An":[37],"emerging":[38],"solution":[39],"recent":[41],"in":[43,101,105],"vision":[44],"NLP":[46],"involves":[47],"finetuning":[48,80,96,119,158],"model":[51,164],"on":[52,166,176],"selection":[54,135,153],"relevant":[56],"before":[58],"its":[59],"target":[63,103,122,167],"task":[64,134,152],"labeled":[67],"samples.":[68],"In":[69],"this":[70,78,94],"paper,":[71],"we":[72,147],"study":[73,172],"justification":[76],"multitask":[79,95],"approach.":[81],"Our":[82,190],"analysis":[84],"reveals":[85],"that":[86,186],"diverse":[89],"set":[90],"related":[92,157],"leads":[97],"reduced":[99],"error":[100],"task,":[104],"comparison":[106],"directly":[108],"adapting":[109],"same":[111],"pretrained":[112],"model.":[113],"We":[114,137,169],"quantify":[115],"relationship":[117],"between":[118],"tasks":[120,123,185],"by":[124],"diversity":[125],"consistency":[127],"metrics,":[128],"further":[130],"propose":[131],"practical":[133],"algorithm.":[136],"substantiate":[138],"our":[139,151,171],"claims":[141],"extensive":[143],"empirical":[144],"evidence.":[145],"Further,":[146],"present":[148],"results":[149],"affirming":[150],"algorithm":[154],"adeptly":[155],"chooses":[156],"providing":[160],"advantages":[161],"performance":[165],"tasks.":[168],"believe":[170],"shed":[173],"light":[175],"lack":[187],"abundant":[188],"labels.":[189],"code":[191],"is":[192],"available":[193],"at":[194],"https://github.com/OliverXUZY/Foudation-Model_Multitask.":[195]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2024-02-27T00:00:00"}
