{"id":"https://openalex.org/W4390489727","doi":"https://doi.org/10.48550/arxiv.2312.17484","title":"Truth Forest: Toward Multi-Scale Truthfulness in Large Language Models through Intervention without Tuning","display_name":"Truth Forest: Toward Multi-Scale Truthfulness in Large Language Models through Intervention without Tuning","publication_year":2023,"publication_date":"2023-12-29","ids":{"openalex":"https://openalex.org/W4390489727","doi":"https://doi.org/10.48550/arxiv.2312.17484"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2312.17484","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.17484","pdf_url":"https://arxiv.org/pdf/2312.17484","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2312.17484","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038929048","display_name":"Zhongzhi Chen","orcid":"https://orcid.org/0000-0002-1954-3027"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Zhongzhi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039337290","display_name":"Xingwu Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Xingwu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102133077","display_name":"Xianfeng Jiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiao, Xianfeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091705422","display_name":"Fengzong Lian","orcid":"https://orcid.org/0000-0002-9871-3038"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lian, Fengzong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020128898","display_name":"Zhanhui Kang","orcid":"https://orcid.org/0009-0006-5151-4222"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kang, Zhanhui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100401482","display_name":"Di Wang","orcid":"https://orcid.org/0000-0003-4908-0243"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Di","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5012773300","display_name":"Chengzhong Xu","orcid":"https://orcid.org/0000-0001-9480-0356"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Cheng-Zhong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5038929048"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9865999817848206,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.6569768190383911},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.6433538198471069},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5822514295578003},{"id":"https://openalex.org/keywords/intervention","display_name":"Intervention (counseling)","score":0.5221688747406006},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.47826969623565674},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4737858474254608},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4566274583339691},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.45113900303840637},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3930380344390869},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3095036745071411},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.14601930975914001},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.12418591976165771},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08294972777366638}],"concepts":[{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.6569768190383911},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.6433538198471069},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5822514295578003},{"id":"https://openalex.org/C2780665704","wikidata":"https://www.wikidata.org/wiki/Q959298","display_name":"Intervention (counseling)","level":2,"score":0.5221688747406006},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.47826969623565674},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4737858474254608},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4566274583339691},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.45113900303840637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3930380344390869},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3095036745071411},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.14601930975914001},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.12418591976165771},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08294972777366638},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2312.17484","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.17484","pdf_url":"https://arxiv.org/pdf/2312.17484","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2312.17484","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2312.17484","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2312.17484","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.17484","pdf_url":"https://arxiv.org/pdf/2312.17484","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G137162417","display_name":null,"funder_award_id":"2020B151513000","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G3992403265","display_name":null,"funder_award_id":"2020B1515130004","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"}],"funders":[{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4390489727.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3193043704","https://openalex.org/W4386259002","https://openalex.org/W1546989560","https://openalex.org/W3171520305","https://openalex.org/W2068608913","https://openalex.org/W3135126032","https://openalex.org/W1924178503","https://openalex.org/W4295532600","https://openalex.org/W4308716060","https://openalex.org/W2063823869"],"abstract_inverted_index":{"Despite":[0],"the":[1,51,68,71,87,131,135],"great":[2],"success":[3],"of":[4,65,89,110,134],"large":[5],"language":[6],"models":[7],"(LLMs)":[8],"in":[9,26,79,102],"various":[10],"tasks,":[11],"they":[12],"suffer":[13],"from":[14,91],"generating":[15,76],"hallucinations.":[16],"We":[17,105],"introduce":[18,55],"Truth":[19],"Forest,":[20],"a":[21,58,107],"method":[22],"that":[23,119,129],"enhances":[24],"truthfulness":[25,88],"LLMs":[27],"by":[28,46],"uncovering":[29],"hidden":[30],"truth":[31,45,77,111],"representations":[32],"using":[33,113],"multi-dimensional":[34],"orthogonal":[35,41,48,120],"probes.":[36,52,114],"Specifically,":[37],"it":[38],"creates":[39],"multiple":[40],"bases":[42],"for":[43],"modeling":[44],"incorporating":[47],"constraints":[49],"into":[50],"Moreover,":[53],"we":[54,85],"Random":[56],"Peek,":[57],"systematic":[59],"technique":[60],"considering":[61],"an":[62],"extended":[63],"range":[64],"positions":[66],"within":[67],"sequence,":[69],"reducing":[70],"gap":[72],"between":[73],"discerning":[74],"and":[75],"features":[78,112],"LLMs.":[80],"By":[81],"employing":[82],"this":[83],"approach,":[84],"improved":[86],"Llama-2-7B":[90],"40.8\\%":[92],"to":[93],"74.5\\%":[94],"on":[95],"TruthfulQA.":[96],"Likewise,":[97],"significant":[98],"improvements":[99],"are":[100],"observed":[101],"fine-tuned":[103],"models.":[104],"conducted":[106],"thorough":[108],"analysis":[109],"Our":[115],"visualization":[116],"results":[117],"show":[118],"probes":[121],"capture":[122],"complementary":[123],"truth-related":[124],"features,":[125],"forming":[126],"well-defined":[127],"clusters":[128],"reveal":[130],"inherent":[132],"structure":[133],"dataset.":[136]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
