{"id":"https://openalex.org/W4412888436","doi":"https://doi.org/10.18653/v1/2025.findings-acl.361","title":"LLM-Forest: Ensemble Learning of LLMs with Graph-Augmented Prompts for Data Imputation","display_name":"LLM-Forest: Ensemble Learning of LLMs with Graph-Augmented Prompts for Data Imputation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412888436","doi":"https://doi.org/10.18653/v1/2025.findings-acl.361"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.findings-acl.361","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.361","pdf_url":"https://aclanthology.org/2025.findings-acl.361.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.findings-acl.361.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103129896","display_name":"Xinrui He","orcid":"https://orcid.org/0009-0001-8526-873X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xinrui He","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110849539","display_name":"Yikun Ban","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yikun Ban","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051330767","display_name":"Jiaru Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiaru Zou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024869027","display_name":"Tianxin Wei","orcid":"https://orcid.org/0000-0003-4450-2005"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tianxin Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066496796","display_name":"Curtiss B. Cook","orcid":"https://orcid.org/0000-0001-5885-9959"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Curtiss Cook","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003062659","display_name":"Jingrui He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jingrui He","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":7.0351,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.96665091,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"6921","last_page":"6936"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9391000270843506,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9327999949455261,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.7374538779258728},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.6466408967971802},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6278426647186279},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4948238730430603},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4450145959854126},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4010418653488159},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.2249026596546173},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.12367776036262512}],"concepts":[{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.7374538779258728},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.6466408967971802},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6278426647186279},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4948238730430603},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4450145959854126},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4010418653488159},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.2249026596546173},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.12367776036262512}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.findings-acl.361","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.361","pdf_url":"https://aclanthology.org/2025.findings-acl.361.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.findings-acl.361","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.361","pdf_url":"https://aclanthology.org/2025.findings-acl.361.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Climate action","score":0.6800000071525574,"id":"https://metadata.un.org/sdg/13"}],"awards":[{"id":"https://openalex.org/G7374246537","display_name":"III: Small: RareXplain: A Computational Framework for Explainable Rare Category Analysis","funder_award_id":"2117902","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412888436.pdf","grobid_xml":"https://content.openalex.org/works/W4412888436.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Missing":[0],"data":[1,16,35,43],"imputation":[2],"is":[3,18,102,137],"a":[4,39,52,69,75,105],"critical":[5],"challenge":[6],"in":[7,34,47,56,61],"various":[8],"domains,":[9],"such":[10],"as":[11],"healthcare":[12],"and":[13,55,59,121,132],"finance,":[14],"where":[15],"completeness":[17],"vital":[19],"for":[20,42,51],"accurate":[21],"analysis.Large":[22],"language":[23],"models":[24],"(LLMs),":[25],"trained":[26],"on":[27,91,104,125],"vast":[28],"corpora,":[29],"have":[30],"shown":[31],"strong":[32],"potential":[33],"generation,":[36],"making":[37],"them":[38],"promising":[40],"tool":[41],"imputation.However,":[44],"challenges":[45],"persist":[46],"designing":[48],"effective":[49],"prompts":[50],"finetuning-free":[53],"process":[54],"mitigating":[57],"biases":[58],"uncertainty":[60],"LLM":[62,80,92],"outputs.To":[63],"address":[64],"these":[65],"issues,":[66],"we":[67],"propose":[68],"novel":[70],"framework,":[71],"LLM-Forest,":[72],"which":[73],"introduces":[74],"\"forest\"":[76],"of":[77,108,134],"few-shot":[78],"learning":[79,98],"\"trees\"":[81],"with":[82,118],"their":[83],"outputs":[84],"aggregated":[85],"via":[86],"confidence-based":[87],"weighted":[88],"voting":[89],"based":[90],"self-assessment,":[93],"inspired":[94],"by":[95],"the":[96,130],"ensemble":[97],"(Random":[99],"Forest).This":[100],"framework":[101],"established":[103],"new":[106],"concept":[107],"bipartite":[109],"information":[110],"graphs":[111],"to":[112],"identify":[113],"high-quality":[114],"relevant":[115],"neighboring":[116],"entries":[117],"both":[119],"feature":[120],"value":[122],"granularity.Extensive":[123],"experiments":[124],"9":[126],"real-world":[127],"datasets":[128],"demonstrate":[129],"effectiveness":[131],"efficiency":[133],"LLM-Forest.The":[135],"implementation":[136],"available":[138],"at":[139],"https:":[140]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
