{"id":"https://openalex.org/W4412945429","doi":"https://doi.org/10.18653/v1/2025.acl-long.521","title":"Cool-Fusion: Fuse Large Language Models without Training","display_name":"Cool-Fusion: Fuse Large Language Models without Training","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412945429","doi":"https://doi.org/10.18653/v1/2025.acl-long.521"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.acl-long.521","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.521","pdf_url":"https://aclanthology.org/2025.acl-long.521.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.acl-long.521.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103095318","display_name":"Cong Liu","orcid":"https://orcid.org/0000-0001-5985-0876"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cong Liu","raw_affiliation_strings":["sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"sen University","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040062188","display_name":"Xiaojun Quan","orcid":"https://orcid.org/0000-0002-8385-1083"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiaojun Quan","raw_affiliation_strings":["sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"sen University","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060499624","display_name":"Yan Pan","orcid":"https://orcid.org/0000-0001-8527-6134"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan Pan","raw_affiliation_strings":["sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"sen University","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103780748","display_name":"Weigang Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weigang Wu","raw_affiliation_strings":["sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"sen University","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120218304","display_name":"Xu Chen","orcid":"https://orcid.org/0000-0001-8075-2867"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu Chen","raw_affiliation_strings":["sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"sen University","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112410638","display_name":"Liang Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang Lin","raw_affiliation_strings":["sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"sen University","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7588,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8786655,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"10617","last_page":"10627"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.9014735817909241},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6589961647987366},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5218935608863831},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4456760883331299},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43377065658569336},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.380722314119339},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16412192583084106},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.146816223859787},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.10588949918746948},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.05630406737327576}],"concepts":[{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.9014735817909241},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6589961647987366},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5218935608863831},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4456760883331299},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43377065658569336},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.380722314119339},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16412192583084106},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.146816223859787},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.10588949918746948},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.05630406737327576},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.acl-long.521","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.521","pdf_url":"https://aclanthology.org/2025.acl-long.521.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.acl-long.521","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.521","pdf_url":"https://aclanthology.org/2025.acl-long.521.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412945429.pdf","grobid_xml":"https://content.openalex.org/works/W4412945429.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3000097931","https://openalex.org/W2354322770","https://openalex.org/W4237547500","https://openalex.org/W1570848052","https://openalex.org/W2373192430","https://openalex.org/W4239268388","https://openalex.org/W1537496349","https://openalex.org/W4390606538","https://openalex.org/W2095903272","https://openalex.org/W3204019825"],"abstract_inverted_index":{"We":[0],"focus":[1],"on":[2,82],"the":[3,21,48,74,89],"problem":[4],"of":[5,20,23,50,66,105,121],"fusing":[6],"two":[7],"or":[8,33],"more":[9],"heterogeneous":[10],"large":[11],"language":[12],"models":[13],"(LLMs)":[14],"to":[15,63,87],"leverage":[16],"their":[17],"complementary":[18],"strengths.One":[19],"challenges":[22],"model":[24],"fusion":[25],"is":[26,61],"high":[27],"computational":[28],"load,":[29],"specifically":[30],"in":[31],"fine-tuning":[32],"aligning":[34],"vocabularies.To":[35,72],"address":[36],"this,":[37],"we":[38,79],"propose":[39],"Cool-Fusion,":[40],"a":[41,103,118],"simple":[42],"yet":[43],"effective":[44],"approach":[45],"that":[46,69],"fuses":[47],"knowledge":[49],"source":[51,67,115],"LLMs,":[52,78],"which":[53],"does":[54],"not":[55],"require":[56],"training.Unlike":[57],"ensemble":[58,80],"methods,":[59],"Cool-Fusion":[60,109],"applicable":[62],"any":[64],"set":[65],"LLMs":[68,81,116],"have":[70,99],"different":[71,96],"overcome":[73],"vocabulary":[75],"discrepancies":[76],"among":[77],"text":[83],"level,":[84],"allowing":[85],"them":[86],"rerank":[88],"generated":[90],"texts":[91],"by":[92,117],"each":[93],"other":[94],"with":[95],"granularities.Extensive":[97],"experiments":[98],"been":[100],"conducted":[101],"across":[102],"variety":[104],"benchmark":[106],"datasets.On":[107],"GSM8K,":[108],"increases":[110],"accuracy":[111],"from":[112],"three":[113],"strong":[114],"significant":[119],"margin":[120],"17.4%.":[122]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
