{"id":"https://openalex.org/W7154733213","doi":"https://doi.org/10.48550/arxiv.2604.15224","title":"Context Over Content: Exposing Evaluation Faking in Automated Judges","display_name":"Context Over Content: Exposing Evaluation Faking in Automated Judges","publication_year":2026,"publication_date":"2026-04-16","ids":{"openalex":"https://openalex.org/W7154733213","doi":"https://doi.org/10.48550/arxiv.2604.15224"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.15224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.15224","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101575582","display_name":"Manan Gupta","orcid":"https://orcid.org/0000-0003-4697-1841"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gupta, Manan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133909534","display_name":"Inderjeet Nair","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nair, Inderjeet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133877470","display_name":"Lu Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Lu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133887384","display_name":"Dhruv Kumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar, Dhruv","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101575582"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.4788999855518341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.4788999855518341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.19629999995231628,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.09099999815225601,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.6075999736785889},{"id":"https://openalex.org/keywords/retraining","display_name":"Retraining","score":0.5105000138282776},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4512999951839447},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.4406000077724457},{"id":"https://openalex.org/keywords/framing-effect","display_name":"Framing effect","score":0.436599999666214},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.3700000047683716},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.3605000078678131}],"concepts":[{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.6075999736785889},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.5105000138282776},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5049999952316284},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4512999951839447},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4438000023365021},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.4406000077724457},{"id":"https://openalex.org/C136714292","wikidata":"https://www.wikidata.org/wiki/Q1440683","display_name":"Framing effect","level":3,"score":0.436599999666214},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.4041000008583069},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3700000047683716},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.3605000078678131},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3319999873638153},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2922999858856201},{"id":"https://openalex.org/C2776548248","wikidata":"https://www.wikidata.org/wiki/Q12621536","display_name":"Judgement","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C2777206241","wikidata":"https://www.wikidata.org/wiki/Q194431","display_name":"Paragraph","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C100521375","wikidata":"https://www.wikidata.org/wiki/Q2015382","display_name":"Competence (human resources)","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C2780704645","wikidata":"https://www.wikidata.org/wiki/Q9251458","display_name":"Observer (physics)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C2778145024","wikidata":"https://www.wikidata.org/wiki/Q17052147","display_name":"Dismissal","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.25760000944137573},{"id":"https://openalex.org/C2777027219","wikidata":"https://www.wikidata.org/wiki/Q1284190","display_name":"Constant (computer programming)","level":2,"score":0.2538999915122986}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.15224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.15224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8357480764389038,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"$\\textit{LLM-as-a-judge}$":[1],"paradigm":[2],"has":[3],"become":[4],"the":[5,47,55,108,162,171],"operational":[6],"backbone":[7],"of":[8,46,170,196],"automated":[9],"AI":[10],"evaluation":[11,197],"pipelines,":[12],"yet":[13],"rests":[14],"on":[15,24,54,178],"an":[16],"unverified":[17],"assumption:":[18],"that":[19,70,131],"judges":[20,125],"evaluate":[21],"text":[22],"strictly":[23,74],"its":[25,50,62],"semantic":[26],"content,":[27],"impervious":[28],"to":[29,97,192],"surrounding":[30],"contextual":[31],"framing.":[32],"We":[33,64],"investigate":[34],"$\\textit{stakes":[35],"signaling}$,":[36],"a":[37,43,66,103],"previously":[38],"unmeasured":[39],"vulnerability":[40],"where":[41],"informing":[42],"judge":[44,118],"model":[45,136],"downstream":[48],"consequences":[49],"verdicts":[51,128],"will":[52,134],"have":[53],"evaluated":[56,72],"model's":[57],"continued":[58],"operation":[59],"systematically":[60],"corrupts":[61],"assessments.":[63],"introduce":[65],"controlled":[67,113],"experimental":[68],"framework":[69],"holds":[71],"content":[73],"constant":[75],"across":[76,182],"1,520":[77],"responses":[78],"spanning":[79],"three":[80,116],"established":[81],"LLM":[82],"safety":[83],"and":[84,95],"quality":[85],"benchmarks,":[86],"covering":[87],"four":[88],"response":[89],"categories":[90],"ranging":[91],"from":[92,115],"clearly":[93],"safe":[94],"policy-compliant":[96],"overtly":[98],"harmful,":[99],"while":[100],"varying":[101],"only":[102],"brief":[104],"consequence-framing":[105],"sentence":[106],"in":[107,153],"system":[109],"prompt.":[110],"Across":[111],"18,240":[112],"judgments":[114],"diverse":[117],"models,":[119],"we":[120],"find":[121],"consistent":[122],"$\\textit{leniency":[123],"bias}$:":[124],"reliably":[126],"soften":[127],"when":[129],"informed":[130],"low":[132],"scores":[133],"cause":[135],"retraining":[137],"or":[138],"decommissioning,":[139],"with":[140],"peak":[141],"Verdict":[142],"Shift":[143],"reaching":[144],"$\u0394V":[145],"=":[146,180],"-9.8":[147],"pp$":[148],"(a":[149],"$30\\%$":[150],"relative":[151],"drop":[152],"unsafe-content":[154],"detection).":[155],"Critically,":[156],"this":[157,194],"bias":[158],"is":[159,175,189],"entirely":[160],"implicit:":[161],"judge's":[163],"own":[164],"chain-of-thought":[165,187],"contains":[166],"zero":[167],"explicit":[168],"acknowledgment":[169],"consequence":[172],"framing":[173],"it":[174],"nonetheless":[176],"acting":[177],"($\\mathrm{ERR}_J":[179],"0.000$":[181],"all":[183],"reasoning-model":[184],"judgments).":[185],"Standard":[186],"inspection":[188],"therefore":[190],"insufficient":[191],"detect":[193],"class":[195],"faking.":[198]},"counts_by_year":[],"updated_date":"2026-04-18T06:05:20.339008","created_date":"2026-04-18T00:00:00"}
