{"id":"https://openalex.org/W7133496794","doi":"https://doi.org/10.48550/arxiv.2603.02588","title":"ExpGuard: LLM Content Moderation in Specialized Domains","display_name":"ExpGuard: LLM Content Moderation in Specialized Domains","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133496794","doi":"https://doi.org/10.48550/arxiv.2603.02588"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.02588","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02588","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.02588","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128047141","display_name":"Minseok Choi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Choi, Minseok","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100393166","display_name":"Dong-Jin Kim","orcid":"https://orcid.org/0009-0001-6780-245X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Dongjin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100825761","display_name":"Seungbin Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Seungbin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128123503","display_name":"Subin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Subin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128075363","display_name":"Youngjun Kwak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwak, Youngjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124078737","display_name":"Juyoung Oh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oh, Juyoung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Choo, Jaegul","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choo, Jaegul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128108663","display_name":"Jungmin Son","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Son, Jungmin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5128047141"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9521999955177307,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9521999955177307,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.006599999964237213,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.006000000052154064,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7530999779701233},{"id":"https://openalex.org/keywords/jargon","display_name":"Jargon","score":0.5127999782562256},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5044999718666077},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.44920000433921814},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4007999897003174},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.39340001344680786},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3677999973297119},{"id":"https://openalex.org/keywords/agile-software-development","display_name":"Agile software development","score":0.3199000060558319}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7530999779701233},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5945000052452087},{"id":"https://openalex.org/C2777611551","wikidata":"https://www.wikidata.org/wiki/Q17951","display_name":"Jargon","level":2,"score":0.5127999782562256},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5044999718666077},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.44920000433921814},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4007999897003174},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.39340001344680786},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.36500000953674316},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.3513000011444092},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3269999921321869},{"id":"https://openalex.org/C14185376","wikidata":"https://www.wikidata.org/wiki/Q30232","display_name":"Agile software development","level":2,"score":0.3199000060558319},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.2913999855518341},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C2777310092","wikidata":"https://www.wikidata.org/wiki/Q1410600","display_name":"Rebuttal","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C137176749","wikidata":"https://www.wikidata.org/wiki/Q4105337","display_name":"Psychological resilience","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.25609999895095825},{"id":"https://openalex.org/C140547941","wikidata":"https://www.wikidata.org/wiki/Q7797194","display_name":"Threat model","level":2,"score":0.2529999911785126},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2524000108242035},{"id":"https://openalex.org/C172191483","wikidata":"https://www.wikidata.org/wiki/Q1071806","display_name":"Provisioning","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.02588","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02588","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.02588","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02588","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,157,205],"growing":[2],"deployment":[3],"of":[4,207],"large":[5],"language":[6],"models":[7,33,169],"(LLMs)":[8],"in":[9,53,177,182],"real-world":[10],"applications,":[11],"establishing":[12],"robust":[13,67,209],"safety":[14,29],"guardrails":[15],"to":[16,25,28,42,73,131,163,175,200],"moderate":[17],"their":[18],"inputs":[19],"and":[20,44,56,68,78,83,103,121,137,145,180,189,196,203],"outputs":[21],"has":[22],"become":[23],"essential":[24],"ensure":[26],"adherence":[27],"policies.":[30],"Current":[31],"guardrail":[32,70,210],"predominantly":[34],"address":[35,60],"general":[36],"human-LLM":[37],"interactions,":[38],"rendering":[39],"LLMs":[40],"vulnerable":[41],"harmful":[43,76],"adversarial":[45,165],"content":[46],"within":[47],"domain-specific":[48,138,164],"contexts,":[49],"particularly":[50],"those":[51],"rich":[52],"technical":[54,136],"jargon":[55],"specialized":[57,69],"concepts.":[58],"To":[59,185],"this":[61],"limitation,":[62],"we":[63,88,191],"introduce":[64],"ExpGuard,":[65],"a":[66,91,123],"model":[71,119,133],"designed":[72],"protect":[74],"against":[75,135],"prompts":[77,98],"responses":[79],"across":[80,156],"financial,":[81],"medical,":[82],"legal":[84],"domains.":[85],"In":[86],"addition,":[87],"present":[89],"ExpGuardMix,":[90],"meticulously":[92],"curated":[93],"dataset":[94,111],"comprising":[95],"58,928":[96],"labeled":[97],"paired":[99],"with":[100],"corresponding":[101],"refusal":[102],"compliant":[104],"responses,":[105],"from":[106],"these":[107],"specific":[108],"sectors.":[109],"This":[110],"is":[112],"divided":[113],"into":[114],"two":[115],"subsets:":[116],"ExpGuardTrain,":[117],"for":[118],"training,":[120],"ExpGuardTest,":[122],"high-quality":[124],"test":[125],"set":[126],"annotated":[127],"by":[128,173],"domain":[129],"experts":[130],"evaluate":[132],"robustness":[134],"content.":[139],"Comprehensive":[140],"evaluations":[141],"conducted":[142],"on":[143],"ExpGuardTest":[144],"eight":[146],"established":[147],"public":[148],"benchmarks":[149],"reveal":[150],"that":[151],"ExpGuard":[152],"delivers":[153],"competitive":[154],"performance":[155],"board":[158],"while":[159],"demonstrating":[160],"exceptional":[161],"resilience":[162],"attacks,":[166],"surpassing":[167],"state-of-the-art":[168],"such":[170],"as":[171],"WildGuard":[172],"up":[174],"8.9%":[176],"prompt":[178],"classification":[179],"15.3%":[181],"response":[183],"classification.":[184],"encourage":[186],"further":[187],"research":[188],"development,":[190],"open-source":[192],"our":[193],"code,":[194],"data,":[195],"model,":[197],"enabling":[198],"adaptation":[199],"additional":[201],"domains":[202],"supporting":[204],"creation":[206],"increasingly":[208],"models.":[211]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-03-05T00:00:00"}
