{"id":"https://openalex.org/W7148702757","doi":"https://doi.org/10.48550/arxiv.2604.01444","title":"Cooking Up Risks: Benchmarking and Reducing Food Safety Risks in Large Language Models","display_name":"Cooking Up Risks: Benchmarking and Reducing Food Safety Risks in Large Language Models","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148702757","doi":"https://doi.org/10.48550/arxiv.2604.01444"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01444","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01444","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01444","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102600282","display_name":"Weidi Luo","orcid":"https://orcid.org/0000-0001-9244-4677"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Luo, Weidi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120586901","display_name":"Xiaofei Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Xiaofei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132894795","display_name":"Tenghao Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Tenghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132858980","display_name":"Hongyi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Hongyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132833085","display_name":"Zhen Xiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiang, Zhen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132887792","display_name":"Chaowei Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Chaowei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031039880","display_name":"Kristina Gligori\u0107","orcid":"https://orcid.org/0000-0001-8726-740X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gligori\u0107, Kristina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132900141","display_name":"Muhao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Muhao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5102600282"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.3695000112056732,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.3695000112056732,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.07020000368356705,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11610","display_name":"Food Security and Health in Diverse Populations","score":0.04560000076889992,"subfield":{"id":"https://openalex.org/subfields/3600","display_name":"General Health Professions"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/food-safety","display_name":"Food safety","score":0.6495000123977661},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.5906999707221985},{"id":"https://openalex.org/keywords/risk-assessment","display_name":"Risk assessment","score":0.4690000116825104},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4595000147819519},{"id":"https://openalex.org/keywords/safeguard","display_name":"Safeguard","score":0.42250001430511475},{"id":"https://openalex.org/keywords/risk-management","display_name":"Risk management","score":0.350600004196167}],"concepts":[{"id":"https://openalex.org/C516717267","wikidata":"https://www.wikidata.org/wiki/Q909821","display_name":"Food safety","level":2,"score":0.6495000123977661},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.6039000153541565},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.5906999707221985},{"id":"https://openalex.org/C12174686","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk assessment","level":2,"score":0.4690000116825104},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.4643000066280365},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4595000147819519},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4530999958515167},{"id":"https://openalex.org/C2780771206","wikidata":"https://www.wikidata.org/wiki/Q3271761","display_name":"Safeguard","level":2,"score":0.42250001430511475},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.3671000003814697},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.350600004196167},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3433000147342682},{"id":"https://openalex.org/C549605437","wikidata":"https://www.wikidata.org/wiki/Q1229911","display_name":"Food security","level":3,"score":0.32190001010894775},{"id":"https://openalex.org/C3017944768","wikidata":"https://www.wikidata.org/wiki/Q1450463","display_name":"Poison control","level":2,"score":0.2630999982357025}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01444","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01444","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01444","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01444","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/2","display_name":"Zero hunger","score":0.5887482166290283}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"are":[4],"increasingly":[5],"deployed":[6],"for":[7],"everyday":[8],"tasks,":[9],"including":[10],"food":[11,17,47,81],"preparation":[12],"and":[13,38,72,84,91,98,140],"health-related":[14],"guidance.":[15],"However,":[16],"safety":[18,39,71,82,112],"remains":[19],"a":[20,78,121,156,169],"high-stakes":[21],"domain":[22],"where":[23],"inaccurate":[24],"or":[25],"misleading":[26],"information":[27],"can":[28],"cause":[29],"severe":[30],"real-world":[31],"harm.":[32],"Despite":[33],"these":[34,150,164],"risks,":[35],"current":[36,108],"LLMs":[37,97,109,129,179],"guardrails":[40,147],"lack":[41],"rigorous":[42],"alignment":[43,113],"tailored":[44],"to":[45,68,120,154,177],"domain-specific":[46,151],"hazards.":[48],"To":[49,162],"address":[50],"this":[51],"gap,":[52],"we":[53,93,166],"introduce":[54,167],"FoodGuardBench,":[55],"the":[56,70,115],"first":[57],"comprehensive":[58],"benchmark":[59],"comprising":[60],"3,339":[61],"queries":[62],"grounded":[63],"in":[64,114],"FDA":[65],"guidelines,":[66],"designed":[67],"evaluate":[69,95],"robustness":[73],"of":[74,80,159],"LLMs.":[75],"By":[76],"constructing":[77],"taxonomy":[79],"principles":[83],"employing":[85],"representative":[86],"jailbreak":[87,124],"attacks":[88],"(e.g.,":[89],"AutoDAN":[90],"PAP),":[92],"systematically":[94,148],"existing":[96,145],"guardrails.":[99],"Our":[100],"evaluation":[101],"results":[102],"reveal":[103],"three":[104],"critical":[105],"vulnerabilities:":[106],"First,":[107],"exhibit":[110],"sparse":[111],"food-related":[116,181],"domain,":[117],"easily":[118],"succumbing":[119],"few":[122],"canonical":[123],"strategies.":[125],"Second,":[126],"when":[127],"compromised,":[128],"frequently":[130],"generate":[131],"actionable":[132],"yet":[133],"harmful":[134],"instructions,":[135],"inadvertently":[136],"empowering":[137],"malicious":[138,160],"actors":[139],"posing":[141],"tangible":[142],"risks.":[143],"Third,":[144],"LLM-based":[146],"overlook":[149],"threats,":[152],"failing":[153],"detect":[155],"substantial":[157],"volume":[158],"inputs.":[161],"mitigate":[163],"vulnerabilities,":[165],"FoodGuard-4B,":[168],"specialized":[170],"guardrail":[171],"model":[172],"fine-tuned":[173],"on":[174],"our":[175],"datasets":[176],"safeguard":[178],"within":[180],"domains.":[182]},"counts_by_year":[],"updated_date":"2026-04-04T06:15:33.020886","created_date":"2026-04-04T00:00:00"}
