{"id":"https://openalex.org/W4377371478","doi":"https://doi.org/10.48550/arxiv.2305.11391","title":"A Survey of Safety and Trustworthiness of Large Language Models through the Lens of Verification and Validation","display_name":"A Survey of Safety and Trustworthiness of Large Language Models through the Lens of Verification and Validation","publication_year":2023,"publication_date":"2023-05-19","ids":{"openalex":"https://openalex.org/W4377371478","doi":"https://doi.org/10.48550/arxiv.2305.11391"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2305.11391","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.11391","pdf_url":"https://arxiv.org/pdf/2305.11391","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2305.11391","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020085889","display_name":"Xiaowei Huang","orcid":"https://orcid.org/0000-0001-6267-0366"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Huang, Xiaowei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074225885","display_name":"Wenjie Ruan","orcid":"https://orcid.org/0000-0002-8311-8738"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ruan, Wenjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100352892","display_name":"Wei Huang","orcid":"https://orcid.org/0000-0003-1418-6267"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048979254","display_name":"Gaojie Jin","orcid":"https://orcid.org/0000-0003-0240-3033"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Gaojie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100650289","display_name":"Yi Dong","orcid":"https://orcid.org/0000-0003-3047-7777"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Yi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113190718","display_name":"Changshun Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Changshun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109183304","display_name":"Saddek Bensalem","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bensalem, Saddek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054272337","display_name":"Ronghui Mu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Ronghui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101413852","display_name":"Qi Yi","orcid":"https://orcid.org/0000-0002-9602-9523"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Yi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100635681","display_name":"Xingyu Zhao","orcid":"https://orcid.org/0000-0002-3474-349X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Xingyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011694726","display_name":"Kaiwen Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Kaiwen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081956313","display_name":"Yanghao Zhang","orcid":"https://orcid.org/0000-0002-8499-0974"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yanghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102402148","display_name":"Sihao Wu","orcid":"https://orcid.org/0009-0005-7032-8903"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Sihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101858900","display_name":"Peipei Xu","orcid":"https://orcid.org/0000-0002-7035-6745"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Peipei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063210265","display_name":"Dengyu Wu","orcid":"https://orcid.org/0000-0003-3699-4273"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Dengyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053978668","display_name":"Andr\u00e9 Freitas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Freitas, Andre","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5074423181","display_name":"Mustafa Mustafa","orcid":"https://orcid.org/0000-0002-8772-8023"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mustafa, Mustafa A.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":17,"corresponding_author_ids":["https://openalex.org/A5020085889"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9595000147819519,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9290000200271606,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.7188106775283813},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6563137173652649},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.47285914421081543},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.45379364490509033},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.44878458976745605},{"id":"https://openalex.org/keywords/unintended-consequences","display_name":"Unintended consequences","score":0.4430136978626251},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.42370229959487915},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.32044923305511475},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.2712818384170532},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.17909356951713562},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.17810118198394775}],"concepts":[{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.7188106775283813},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6563137173652649},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.47285914421081543},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.45379364490509033},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.44878458976745605},{"id":"https://openalex.org/C2776889888","wikidata":"https://www.wikidata.org/wiki/Q1135789","display_name":"Unintended consequences","level":2,"score":0.4430136978626251},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.42370229959487915},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.32044923305511475},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2712818384170532},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.17909356951713562},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.17810118198394775},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2305.11391","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.11391","pdf_url":"https://arxiv.org/pdf/2305.11391","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2305.11391","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2305.11391","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2305.11391","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.11391","pdf_url":"https://arxiv.org/pdf/2305.11391","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G849311619","display_name":null,"funder_award_id":"EP/T026995/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4377371478.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2120447654","https://openalex.org/W2977179488","https://openalex.org/W2144453115","https://openalex.org/W2128223750","https://openalex.org/W4238532390","https://openalex.org/W2188872161","https://openalex.org/W2961779879","https://openalex.org/W797688974","https://openalex.org/W2002978035","https://openalex.org/W2209382646"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4,78],"exploded":[5],"a":[6],"new":[7],"heatwave":[8],"of":[9,53,101,116,128,161,170,196],"AI":[10],"for":[11,82,191],"their":[12,32,42,102,131],"ability":[13],"to":[14,31,97,119,123,156,178,192],"engage":[15],"end-users":[16],"in":[17,35],"human-level":[18],"conversations":[19],"with":[20,198],"detailed":[21],"and":[22,44,51,62,69,73,85,110,126,130,140,145,147,164,182,200],"articulate":[23],"answers":[24],"across":[25],"many":[26,36],"knowledge":[27],"domains.":[28],"In":[29,150],"response":[30],"fast":[33],"adoption":[34],"industrial":[37],"applications,":[38],"this":[39],"survey":[40],"concerns":[41],"safety":[43,125,163,181,199],"trustworthiness.":[45],"First,":[46],"we":[47,66,134],"review":[48],"known":[49],"vulnerabilities":[50],"limitations":[52],"the":[54,71,99,105,114,117,124,158,162,168,180,194],"LLMs,":[55],"categorising":[56],"them":[57],"into":[58],"inherent":[59],"issues,":[60,184],"attacks,":[61],"unintended":[63],"bugs.":[64],"Then,":[65],"consider":[67,135],"if":[68],"how":[70],"Verification":[72],"Validation":[74],"(V&amp;V)":[75],"techniques,":[76],"which":[77],"been":[79,176],"widely":[80],"developed":[81],"traditional":[83],"software":[84],"deep":[86],"learning":[87],"models":[88],"such":[89],"as":[90,94],"convolutional":[91],"neural":[92],"networks":[93],"independent":[95],"processes":[96],"check":[98],"alignment":[100,195],"implementations":[103],"against":[104],"specifications,":[106],"can":[107],"be":[108],"integrated":[109],"further":[111],"extended":[112],"throughout":[113],"lifecycle":[115],"LLMs":[118,129,197],"provide":[120],"rigorous":[121,185],"analysis":[122],"trustworthiness":[127,165,183,201],"applications.":[132],"Specifically,":[133],"four":[136],"complementary":[137],"techniques:":[138],"falsification":[139],"evaluation,":[141],"verification,":[142],"runtime":[143],"monitoring,":[144],"regulations":[146],"ethical":[148],"use.":[149],"total,":[151],"370+":[152],"references":[153],"are":[154,189],"considered":[155],"support":[157],"quick":[159],"understanding":[160],"issues":[166],"from":[167],"perspective":[169],"V&amp;V.":[171],"While":[172],"intensive":[173],"research":[174],"has":[175],"conducted":[177],"identify":[179],"yet":[186],"practical":[187],"methods":[188],"called":[190],"ensure":[193],"requirements.":[202]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
