{"id":"https://openalex.org/W4385562719","doi":"https://doi.org/10.1145/3580305.3599209","title":"Foundations and Applications in Large-scale AI Models: Pre-training, Fine-tuning, and Prompt-based Learning","display_name":"Foundations and Applications in Large-scale AI Models: Pre-training, Fine-tuning, and Prompt-based Learning","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4385562719","doi":"https://doi.org/10.1145/3580305.3599209"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599209","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1145/3580305.3599209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055484401","display_name":"Derek Zhiyuan Cheng","orcid":"https://orcid.org/0009-0000-7943-8328"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Derek Cheng","raw_affiliation_strings":["Google Research, Mountain View, CA, USA"],"raw_orcid":"https://orcid.org/0009-0000-7943-8328","affiliations":[{"raw_affiliation_string":"Google Research, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033934770","display_name":"Dhaval Patel","orcid":"https://orcid.org/0000-0002-5449-6975"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dhaval Patel","raw_affiliation_strings":["IBM Research, New York, NY, USA"],"raw_orcid":"https://orcid.org/0000-0001-6210-0902","affiliations":[{"raw_affiliation_string":"IBM Research, New York, NY, USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033127375","display_name":"Linsey Pang","orcid":"https://orcid.org/0000-0002-4784-9795"},"institutions":[{"id":"https://openalex.org/I4210155268","display_name":"Salesforce (United States)","ror":"https://ror.org/057315g56","country_code":"US","type":"company","lineage":["https://openalex.org/I4210155268"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Linsey Pang","raw_affiliation_strings":["Salesforce, San Francisco, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-4784-9795","affiliations":[{"raw_affiliation_string":"Salesforce, San Francisco, CA, USA","institution_ids":["https://openalex.org/I4210155268"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046646390","display_name":"Sameep Mehta","orcid":"https://orcid.org/0000-0002-9599-1526"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sameep Mehta","raw_affiliation_strings":["IBM Research, Bengaluru, India"],"raw_orcid":"https://orcid.org/0000-0002-9599-1526","affiliations":[{"raw_affiliation_string":"IBM Research, Bengaluru, India","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028885505","display_name":"Kexin Xie","orcid":"https://orcid.org/0000-0003-0766-7206"},"institutions":[{"id":"https://openalex.org/I4210155268","display_name":"Salesforce (United States)","ror":"https://ror.org/057315g56","country_code":"US","type":"company","lineage":["https://openalex.org/I4210155268"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kexin Xie","raw_affiliation_strings":["Salesforce, San Francisco, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-0766-7206","affiliations":[{"raw_affiliation_string":"Salesforce, San Francisco, CA, USA","institution_ids":["https://openalex.org/I4210155268"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028125399","display_name":"Ed H.","orcid":"https://orcid.org/0000-0003-3230-5338"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ed H. Chi","raw_affiliation_strings":["Google Research, Mountain View, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-3230-5338","affiliations":[{"raw_affiliation_string":"Google Research, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006713797","display_name":"Wei Liu","orcid":"https://orcid.org/0000-0002-3003-1313"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["University of Technology Sydney, Sydney, NSW, Australia"],"raw_orcid":"https://orcid.org/0000-0002-3003-1313","affiliations":[{"raw_affiliation_string":"University of Technology Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068157871","display_name":"Nitesh V. Chawla","orcid":"https://orcid.org/0000-0003-3932-5956"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nitesh Chawla","raw_affiliation_strings":["University of Notre Dame, Indiana, IN, USA"],"raw_orcid":"https://orcid.org/0000-0003-3932-5956","affiliations":[{"raw_affiliation_string":"University of Notre Dame, Indiana, IN, USA","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101609697","display_name":"James Bailey","orcid":"https://orcid.org/0000-0002-3769-3811"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"The University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"James Bailey","raw_affiliation_strings":["University of Melbourne, Melbourne, VIC, Australia"],"raw_orcid":"https://orcid.org/0000-0002-3769-3811","affiliations":[{"raw_affiliation_string":"University of Melbourne, Melbourne, VIC, Australia","institution_ids":["https://openalex.org/I165779595"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5055484401"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":0.2355,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.51226802,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"5853","last_page":"5854"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7862217426300049},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.7398178577423096},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5705021619796753},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5546694993972778},{"id":"https://openalex.org/keywords/paradigm-shift","display_name":"Paradigm shift","score":0.5480067133903503},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5451693534851074},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5164135098457336},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.46697568893432617},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4378819465637207},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.36015164852142334}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7862217426300049},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.7398178577423096},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5705021619796753},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5546694993972778},{"id":"https://openalex.org/C43540301","wikidata":"https://www.wikidata.org/wiki/Q689971","display_name":"Paradigm shift","level":2,"score":0.5480067133903503},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5451693534851074},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5164135098457336},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.46697568893432617},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4378819465637207},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.36015164852142334},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580305.3599209","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1145/3580305.3599209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":1,"referenced_works":["https://openalex.org/W3185341429"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W2949522393","https://openalex.org/W4289422896"],"abstract_inverted_index":{"Deep":[0],"learning":[1],"techniques":[2],"have":[3],"advanced":[4],"rapidly":[5],"in":[6,13,22,74,145,183],"recent":[7,94],"years,":[8],"leading":[9],"to":[10,87,100,112,126,169],"significant":[11],"progress":[12],"pre-trained":[14],"and":[15,39,60,79,105,123,137,148,175],"fine-tuned":[16],"large-scale":[17,152,170],"AI":[18,59,153,171],"models.":[19,154],"For":[20],"example,":[21],"the":[23,28,36,93,107,110,157,184],"natural":[24],"language":[25,80],"processing":[26],"domain,":[27],"traditional":[29],"\"pre-train,":[30,37],"fine-tune\"":[31],"paradigm":[32,103],"is":[33,98,143],"shifting":[34],"towards":[35],"prompt,":[38],"predict\"":[40],"paradigm,":[41],"which":[42,84],"has":[43,69],"achieved":[44],"great":[45],"success":[46],"on":[47,165],"many":[48],"tasks":[49,88],"across":[50],"different":[51,114],"application":[52],"domains":[53],"such":[54],"as":[55],"ChatGPT/BARD":[56],"for":[57,62,121,151],"Conversational":[58],"P5":[61],"a":[63,71,119,160],"unified":[64],"recommendation":[65],"system.":[66],"Moreover,":[67],"there":[68],"been":[70],"growing":[72],"interest":[73],"models":[75],"that":[76,178],"combine":[77],"vision":[78],"modalities":[81],"(vision-language":[82],"models)":[83],"are":[85],"applied":[86],"like":[89],"Visual":[90],"Captioning/Generation.":[91],"Considering":[92],"technological":[95],"revolution,":[96],"it":[97],"essential":[99],"emphasize":[101],"these":[102],"shifts":[104],"highlight":[106],"paradigms":[108],"with":[109],"potential":[111],"solve":[113],"tasks.":[115],"We":[116,155],"thus":[117],"provide":[118],"platform":[120],"academic":[122],"industrial":[124],"researchers":[125],"showcase":[127],"their":[128],"latest":[129],"work,":[130],"share":[131],"research":[132,142,162],"ideas,":[133],"discuss":[134],"various":[135],"challenges,":[136],"identify":[138],"areas":[139],"where":[140],"further":[141],"needed":[144],"pre-training,":[146],"fine-tuning,":[147],"prompt-learning":[149],"methods":[150],"foster":[156],"development":[158],"of":[159],"strong":[161],"community":[163],"focused":[164],"solving":[166],"challenges":[167],"related":[168],"models,":[172],"providing":[173],"superior":[174],"impactful":[176],"strategies":[177],"can":[179],"change":[180],"people's":[181],"lives":[182],"future.":[185]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
