{"id":"https://openalex.org/W4403791792","doi":"https://doi.org/10.1145/3664647.3680843","title":"GIST: Improving Parameter Efficient Fine-Tuning via Knowledge Interaction","display_name":"GIST: Improving Parameter Efficient Fine-Tuning via Knowledge Interaction","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791792","doi":"https://doi.org/10.1145/3664647.3680843"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680843","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680843","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114416551","display_name":"Jiacheng Ruan","orcid":"https://orcid.org/0000-0001-5469-507X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiacheng Ruan","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-5469-507X","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026260510","display_name":"Jingsheng Gao","orcid":"https://orcid.org/0000-0001-6271-0903"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong 
University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingsheng Gao","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-6271-0903","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076218215","display_name":"Mingye Xie","orcid":"https://orcid.org/0000-0001-9826-9806"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingye Xie","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-9826-9806","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027871520","display_name":"Suncheng Xiang","orcid":"https://orcid.org/0000-0002-9141-6460"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Suncheng Xiang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-9141-6460","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, 
China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048053848","display_name":"Zefang Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zefang Yu","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0007-7198-3664","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100418165","display_name":"Ting Liu","orcid":"https://orcid.org/0000-0003-3489-4578"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Liu","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-3489-4578","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101704886","display_name":"Yuzhuo Fu","orcid":"https://orcid.org/0000-0001-5516-3016"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuzhuo Fu","raw_affiliation_strings":["Shanghai Jiao Tong University, 
Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-5516-3016","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065871371","display_name":"Xiaoye Qu","orcid":"https://orcid.org/0000-0002-4907-3978"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoye Qu","raw_affiliation_strings":["Shanghai Artificial Intelligence Laboratory, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4907-3978","affiliations":[{"raw_affiliation_string":"Shanghai Artificial Intelligence Laboratory, Shanghai, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4391012619"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5114416551"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":1.1904,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80672607,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"8835","last_page":"8844"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network 
Applications","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9664999842643738,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9611999988555908,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gist","display_name":"GiST","score":0.7921031713485718},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer 
science","score":0.6370543837547302},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.10875946283340454}],"concepts":[{"id":"https://openalex.org/C2775922572","wikidata":"https://www.wikidata.org/wiki/Q83567","display_name":"GiST","level":3,"score":0.7921031713485718},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6370543837547302},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.10875946283340454},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.0},{"id":"https://openalex.org/C16930146","wikidata":"https://www.wikidata.org/wiki/Q4381253","display_name":"Stromal cell","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680843","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680843","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on 
Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1977295328","https://openalex.org/W2047643928","https://openalex.org/W2108598243","https://openalex.org/W2138011018","https://openalex.org/W2187089797","https://openalex.org/W2533598788","https://openalex.org/W2979826702","https://openalex.org/W2987861506","https://openalex.org/W3034368386","https://openalex.org/W3034695001","https://openalex.org/W3041133507","https://openalex.org/W3135939397","https://openalex.org/W3138154797","https://openalex.org/W3138516171","https://openalex.org/W4205991051","https://openalex.org/W4226512186","https://openalex.org/W4282005462","https://openalex.org/W4312651322","https://openalex.org/W4312983485","https://openalex.org/W4322766882","https://openalex.org/W4382463911","https://openalex.org/W4385573776","https://openalex.org/W4386071547","https://openalex.org/W4390873067","https://openalex.org/W4393156091","https://openalex.org/W4402727025"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2324878617","https://openalex.org/W2359581215","https://openalex.org/W3087259005","https://openalex.org/W2512571674","https://openalex.org/W2325192466","https://openalex.org/W2009098253","https://openalex.org/W3087198384"],"abstract_inverted_index":{"Recently,":[0],"the":[1,32,43,55,58,66,101,118,135,140,163,184,203,207,215,229],"Parameter":[2],"Efficient":[3],"Fine-Tuning":[4],"(PEFT)":[5],"method,":[6],"which":[7],"adjusts":[8],"or":[9],"introduces":[10,113],"fewer":[11],"trainable":[12,47,115],"parameters":[13,48,238],"to":[14,75,152,187,224],"calibrate":[15],"pre-trained":[16,63,185],"models":[17,64],"on":[18,125,202,228],"downstream":[19,50,70,126,149,189],"tasks,":[20],"has":[21],"be
en":[22],"a":[23,89,106,114,169,175,225],"hot":[24],"research":[25],"topic.":[26],"However,":[27],"existing":[28],"PEFT":[29,103,123,141,177,216],"methods":[30,104,124,142,178],"within":[31,179,218],"traditional":[33],"fine-tuning":[34,91],"framework":[35,111,181,221],"have":[36],"two":[37],"main":[38],"shortcomings:":[39],"1)":[40],"They":[41,53],"overlook":[42],"explicit":[44,146,154],"association":[45,147],"between":[46,57,156],"and":[49,65,80,143,158,209],"knowledge.":[51,199],"2)":[52],"neglect":[54],"interaction":[56,155,167],"intrinsic":[59],"task-agnostic":[60,157],"knowledge":[61,68,79,137,166],"of":[62,69,78,134,165,198,211,235,240],"task-specific":[67,136,159],"tasks.":[71,127,150],"These":[72],"oversights":[73],"lead":[74],"insufficient":[76],"utilization":[77],"suboptimal":[81],"performance.":[82],"To":[83],"address":[84],"these":[85],"issues,":[86],"we":[87,161],"propose":[88],"novel":[90],"framework,":[92],"named":[93],"GIST,":[94],"that":[95],"can":[96,182],"be":[97],"seamlessly":[98],"integrated":[99],"into":[100],"current":[102],"in":[105],"plug-and-play":[107],"manner.":[108],"Specifically,":[109],"our":[110,180,212,219],"first":[112],"token,":[116,120],"called":[117],"Gist":[119],"when":[121],"applying":[122],"This":[128],"token":[129],"serves":[130],"as":[131],"an":[132,145,233],"aggregator":[133],"learned":[138],"by":[139,193],"builds":[144],"with":[148,232],"Furthermore,":[151],"facilitate":[153],"knowledge,":[160],"introduce":[162],"concept":[164],"via":[168],"Bidirectional":[170],"Kullback-Leibler":[171],"Divergence":[172],"objective.":[173],"As":[174],"result,":[176],"enable":[183],"model":[186],"understand":[188],"tasks":[190],"more":[191],"comprehensively":[192],"fully":[194],"leveraging":[195],"both":[196],"types":[197],"Extensive":[200],"experiments":[201],"35":[204],"datasets":[205],"demonstrate":[206],"universality":[208],"scalability":[210],"framework.":[213],"Notably,":[214],"method":[217],"GIST":[220],"achieves":[222],"up":[223],"2
.25%":[226],"increase":[227],"VTAB-1K":[230],"benchmark":[231],"addition":[234],"just":[236],"0.8K":[237],"(0.009\u2030":[239],"ViT-B/16).":[241],"The":[242],"code":[243],"is":[244],"available":[245],"at":[246],"https://github.com/JCruan519/GIST.":[247]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
