{"id":"https://openalex.org/W4414359857","doi":"https://doi.org/10.24963/ijcai.2025/693","title":"Connecting Giants: Synergistic Knowledge Transfer of Large Multimodal Models for Few-Shot Learning","display_name":"Connecting Giants: Synergistic Knowledge Transfer of Large Multimodal Models for Few-Shot Learning","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4414359857","doi":"https://doi.org/10.24963/ijcai.2025/693"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2025/693","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/693","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://ink.library.smu.edu.sg/sis_research/10790","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005624589","display_name":"Hao Tang","orcid":"https://orcid.org/0000-0002-6973-8121"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Hao Tang","raw_affiliation_strings":["The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114190795","display_name":"Shengfeng He","orcid":null},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shengfeng He","raw_affiliation_strings":["Singapore Management University"],"affiliations":[{"raw_affiliation_string":"Singapore Management University","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100662807","display_name":"Jing Qin","orcid":"https://orcid.org/0000-0002-7059-0929"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jing Qin","raw_affiliation_strings":["The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5005624589"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":14.4341,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.98680242,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"6227","last_page":"6235"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.8435999751091003,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.8435999751091003,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.8241999745368958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11609","display_name":"Geophysical Methods and Applications","score":0.7889000177383423,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6590999960899353},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.5461000204086304},{"id":"https://openalex.org/keywords/knowledge-transfer","display_name":"Knowledge transfer","score":0.5157999992370605},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.45239999890327454},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.44589999318122864},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.42879998683929443},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4083000123500824},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.391400009393692}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7796000242233276},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6590999960899353},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5461000204086304},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5367000102996826},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.5157999992370605},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48489999771118164},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.45239999890327454},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.44589999318122864},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.42879998683929443},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4083000123500824},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.36980000138282776},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.36320000886917114},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.35190001130104065},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.3305000066757202},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32089999318122864},{"id":"https://openalex.org/C2777220311","wikidata":"https://www.wikidata.org/wiki/Q6423340","display_name":"Knowledge acquisition","level":2,"score":0.31679999828338623},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.2865000069141388},{"id":"https://openalex.org/C56814567","wikidata":"https://www.wikidata.org/wiki/Q1323686","display_name":"Explicit knowledge","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.2802000045776367},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.26489999890327454},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.2646999955177307},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.2563999891281128},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.25209999084472656}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.24963/ijcai.2025/693","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/693","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-11792","is_oa":true,"landing_page_url":"https://ink.library.smu.edu.sg/sis_research/10790","pdf_url":null,"source":{"id":"https://openalex.org/S4306401925","display_name":"Singapore Management University Institutional Knowledge (InK) (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://doi.org/10.24963/ijcai.2025/693","raw_type":"Conference Proceeding Article"}],"best_oa_location":{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-11792","is_oa":true,"landing_page_url":"https://ink.library.smu.edu.sg/sis_research/10790","pdf_url":null,"source":{"id":"https://openalex.org/S4306401925","display_name":"Singapore Management University Institutional Knowledge (InK) (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://doi.org/10.24963/ijcai.2025/693","raw_type":"Conference Proceeding Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Few-shot":[0],"learning":[1],"(FSL)":[2],"addresses":[3],"the":[4,36,65],"challenge":[5],"of":[6],"classifying":[7],"novel":[8,46],"classes":[9],"with":[10,172],"limited":[11],"training":[12],"samples.":[13],"While":[14],"some":[15],"methods":[16],"leverage":[17],"semantic":[18,112,128,135,150],"knowledge":[19,58,90,100,123,136],"from":[20,59],"smaller-scale":[21],"models":[22,62,108],"to":[23,35,63,109,153],"mitigate":[24],"data":[25],"scarcity,":[26],"these":[27],"approaches":[28],"often":[29],"introduce":[30],"noise":[31],"and":[32,56,77,127,133,148],"bias":[33],"due":[34],"data\u2019s":[37],"inherent":[38],"simplicity.":[39],"In":[40],"this":[41],"paper,":[42],"we":[43],"propose":[44],"a":[45,74,79,84,97,117,144,149,173],"framework,":[47],"Synergistic":[48],"Knowledge":[49],"Transfer":[50],"(SynTrans),":[51],"which":[52],"effectively":[53],"transfers":[54],"diverse":[55],"complementary":[57],"large":[60,106],"multimodal":[61,107,157],"empower":[64],"off-the-shelf":[66],"few-shot":[67,80,175],"learner.":[68],"Specifically,":[69],"SynTrans":[70,142],"employs":[71],"CLIP":[72],"as":[73,83],"robust":[75],"teacher":[76],"uses":[78],"vision":[81,176],"encoder":[82],"weak":[85],"student,":[86],"distilling":[87],"semantic-aligned":[88],"visual":[89,126,132,145],"via":[91],"an":[92],"unsupervised":[93],"proxy":[94],"task.":[95],"Subsequently,":[96],"training-free":[98],"synergistic":[99],"mining":[101],"module":[102,120],"facilitates":[103],"collaboration":[104],"among":[105],"extract":[110],"high-quality":[111],"knowledge.":[113],"Building":[114],"upon":[115],"this,":[116],"visual-semantic":[118],"bridging":[119],"enables":[121],"bi-directional":[122],"transfer":[124],"between":[125],"spaces,":[129],"transforming":[130],"explicit":[131],"implicit":[134],"into":[137],"category-specific":[138],"classifier":[139],"weights.":[140],"Finally,":[141],"introduces":[143],"weight":[146,151],"generator":[147],"reconstructor":[152],"adaptively":[154],"construct":[155],"optimal":[156],"FSL":[158,164],"classifiers.":[159],"Experimental":[160],"results":[161],"on":[162],"four":[163],"datasets":[165],"demonstrate":[166],"that":[167],"SynTrans,":[168],"even":[169],"when":[170],"paired":[171],"simple":[174],"encoder,":[177],"significantly":[178],"outperforms":[179],"current":[180],"state-of-the-art":[181],"methods.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
